Seed: [42, 37, 8, 67, 52]
Alpha Value: 0.1
Learning Rate: 0.01
Discount Factor: 0.9
Number of Episodes: 50
Max Iterations: 500
Number of Batches: 5
Directory Path ./tests/mountaincar/alpha_0_1/
batch = 1
inside iterator
Iteration [  0  ]
Obj. val : -23.13358787772506, Avg. Ret : -19.64077448656745
Iteration [  1  ]
Obj. val : -23.15475225080538, Avg. Ret : -19.63589380044115
Iteration [  2  ]
Obj. val : -22.870517538828256, Avg. Ret : -19.59222771700629
Iteration [  3  ]
Obj. val : -22.93048856852109, Avg. Ret : -19.62178798858882
Iteration [  4  ]
Obj. val : -22.952341548199662, Avg. Ret : -19.813808478097627
Iteration [  5  ]
Obj. val : -23.543219534731545, Avg. Ret : -19.9042329582923
Iteration [  6  ]
Obj. val : -22.348075076351215, Avg. Ret : -19.614097006994573
Iteration [  7  ]
Obj. val : -22.710437817990158, Avg. Ret : -19.795268328504527
Iteration [  8  ]
Obj. val : -22.76310685496662, Avg. Ret : -19.846804584650215
Iteration [  9  ]
Obj. val : -23.176603321241647, Avg. Ret : -19.82612160641166
Iteration [  10  ]
Obj. val : -22.360639493241983, Avg. Ret : -19.91999721323878
Iteration [  11  ]
Obj. val : -23.089582558150727, Avg. Ret : -19.861296943503636
Iteration [  12  ]
Obj. val : -22.59557175178087, Avg. Ret : -19.657693343385535
Iteration [  13  ]
Obj. val : -22.83652602300446, Avg. Ret : -19.69311697160379
Iteration [  14  ]
Obj. val : -22.16903314625183, Avg. Ret : -19.879819517666817
Iteration [  15  ]
Obj. val : 50.03649972619161, Avg. Ret : -19.755518793313463
Iteration [  16  ]
Obj. val : -22.587340542611297, Avg. Ret : -19.927476666373526
Iteration [  17  ]
Obj. val : -22.36744288414799, Avg. Ret : -19.744779693768628
Iteration [  18  ]
Obj. val : -22.391623979413083, Avg. Ret : -19.664085845883193
Iteration [  19  ]
Obj. val : -21.976340935387633, Avg. Ret : -19.84049165439741
Iteration [  20  ]
Obj. val : -21.36247182406786, Avg. Ret : -37.228615199836014
Iteration [  21  ]
Obj. val : -22.660513306095595, Avg. Ret : -28.15014509121887
Iteration [  22  ]
Obj. val : -22.239363451643776, Avg. Ret : -18.048301544112118
Iteration [  23  ]
Obj. val : -21.998448202261805, Avg. Ret : -31.17083385431452
Iteration [  24  ]
Obj. val : -22.18659456007396, Avg. Ret : -26.78259784477039
Iteration [  25  ]
Obj. val : -21.947572049804513, Avg. Ret : -18.316665824390014
Iteration [  26  ]
Obj. val : -21.76371114310598, Avg. Ret : -17.207084226966728
Iteration [  27  ]
Obj. val : -21.73503478433356, Avg. Ret : -25.338787610387985
Iteration [  28  ]
Obj. val : 53.658666225214695, Avg. Ret : -24.34357954121078
Iteration [  29  ]
Obj. val : -21.679536065161052, Avg. Ret : -16.953045177403027
Iteration [  30  ]
Obj. val : -21.59475867341241, Avg. Ret : -17.436028970581663
Iteration [  31  ]
Obj. val : -21.615280882377704, Avg. Ret : -23.688696023370554
Iteration [  32  ]
Obj. val : -21.434307878482205, Avg. Ret : -23.15305508348209
Iteration [  33  ]
Obj. val : -21.841327930226516, Avg. Ret : -17.409113949589745
Iteration [  34  ]
Obj. val : -21.813132454926688, Avg. Ret : -22.570691076745515
Iteration [  35  ]
Obj. val : -21.4104103859917, Avg. Ret : -17.80630117471423
Iteration [  36  ]
Obj. val : -21.390962471000513, Avg. Ret : -22.212901283130172
Iteration [  37  ]
Obj. val : -21.39151739936083, Avg. Ret : -17.81709257341111
Iteration [  38  ]
Obj. val : -21.20717434162307, Avg. Ret : -22.04872094764969
Iteration [  39  ]
Obj. val : -21.48902053607356, Avg. Ret : -17.976686824353532
Iteration [  40  ]
Obj. val : -21.534183319692026, Avg. Ret : -24.87220715791652
Iteration [  41  ]
Obj. val : -21.126577933928026, Avg. Ret : -20.71711382296101
Iteration [  42  ]
Obj. val : -21.096960296848735, Avg. Ret : -19.165154397885434
Iteration [  43  ]
Obj. val : -20.719191340783013, Avg. Ret : -24.803166796070492
Iteration [  44  ]
Obj. val : -21.03046045260235, Avg. Ret : -20.259812441788355
Iteration [  45  ]
Obj. val : -20.9420072898924, Avg. Ret : -19.247555484418807
Iteration [  46  ]
Obj. val : -20.741889067607456, Avg. Ret : -24.49735363227152
Iteration [  47  ]
Obj. val : -20.71105010721301, Avg. Ret : -20.12047646794663
Iteration [  48  ]
Obj. val : -20.833224842390386, Avg. Ret : -19.194380471373265
Iteration [  49  ]
Obj. val : -20.963425250289855, Avg. Ret : -24.58709332143053
Iteration [  50  ]
Obj. val : -21.152269122303142, Avg. Ret : -19.581243875190456
Iteration [  51  ]
Obj. val : -20.928130004879023, Avg. Ret : -20.034401435514926
Iteration [  52  ]
Obj. val : -20.890793157958036, Avg. Ret : -24.480810162270508
Iteration [  53  ]
Obj. val : -20.803090882339852, Avg. Ret : -18.934637874002796
Iteration [  54  ]
Obj. val : -21.19830386418678, Avg. Ret : -19.76605880182643
Iteration [  55  ]
Obj. val : -20.382191392579283, Avg. Ret : -24.709381014286606
Iteration [  56  ]
Obj. val : -20.77702266428489, Avg. Ret : -19.66948597107168
Iteration [  57  ]
Obj. val : -21.087716414675718, Avg. Ret : -18.87016278425307
Iteration [  58  ]
Obj. val : -20.928141683017394, Avg. Ret : -24.27687606800755
Iteration [  59  ]
Obj. val : -19.753666138423664, Avg. Ret : -19.75974004737801
Iteration [  60  ]
Obj. val : -20.726500654170188, Avg. Ret : -18.722391890301825
Iteration [  61  ]
Obj. val : -20.908444406005827, Avg. Ret : -24.458336373819407
Iteration [  62  ]
Obj. val : -20.038922414818238, Avg. Ret : -20.1373092819607
Iteration [  63  ]
Obj. val : -21.126877747911752, Avg. Ret : -18.826003752103965
Iteration [  64  ]
Obj. val : -20.46276318044903, Avg. Ret : -24.48244648008572
Iteration [  65  ]
Obj. val : -20.455135545179612, Avg. Ret : -18.77906551123293
Iteration [  66  ]
Obj. val : -20.299780211817637, Avg. Ret : -19.917612744624627
Iteration [  67  ]
Obj. val : -20.571681008971193, Avg. Ret : -24.561592651977435
Iteration [  68  ]
Obj. val : -20.513580878277125, Avg. Ret : -18.763188232383868
Iteration [  69  ]
Obj. val : -20.003496789054704, Avg. Ret : -19.236672614521847
Iteration [  70  ]
Obj. val : -20.35372606459114, Avg. Ret : -24.22920931158913
Iteration [  71  ]
Obj. val : 52.48105526735271, Avg. Ret : -19.78372536853061
Iteration [  72  ]
Obj. val : -20.44168842144574, Avg. Ret : -18.822951661977164
Iteration [  73  ]
Obj. val : -20.398398819783385, Avg. Ret : -24.23985446547009
Iteration [  74  ]
Obj. val : -20.04857144501054, Avg. Ret : -18.771168148316043
Iteration [  75  ]
Obj. val : -20.022856522946267, Avg. Ret : -19.167621763395115
Iteration [  76  ]
Obj. val : -19.380056972248564, Avg. Ret : -24.09732215289379
Iteration [  77  ]
Obj. val : 51.98965418594812, Avg. Ret : -19.137445434564803
Iteration [  78  ]
Obj. val : -20.157240260724436, Avg. Ret : -18.839668076301034
Iteration [  79  ]
Obj. val : -19.839409056964982, Avg. Ret : -24.219719090974813
Iteration [  80  ]
Obj. val : -19.975339595025577, Avg. Ret : -19.030792184726415
Iteration [  81  ]
Obj. val : -20.120689616368413, Avg. Ret : -18.791941728533477
Iteration [  82  ]
Obj. val : -20.106800894902552, Avg. Ret : -23.979419341068976
Iteration [  83  ]
Obj. val : -20.086102290282046, Avg. Ret : -19.08117110233412
Iteration [  84  ]
Obj. val : -19.953057164940848, Avg. Ret : -18.86968610238714
Iteration [  85  ]
Obj. val : -20.233618008156217, Avg. Ret : -22.052080872393272
Iteration [  86  ]
Obj. val : -19.798410539037768, Avg. Ret : -19.036824941411474
Iteration [  87  ]
Obj. val : -19.991588547232364, Avg. Ret : -18.533887935575184
Iteration [  88  ]
Obj. val : -19.82652143326648, Avg. Ret : -24.379527371443515
Iteration [  89  ]
Obj. val : -19.962079663243273, Avg. Ret : -18.561087026439132
Iteration [  90  ]
Obj. val : -19.39520836245241, Avg. Ret : -19.569894522196616
Iteration [  91  ]
Obj. val : -19.52854234332167, Avg. Ret : -23.8781288979754
Iteration [  92  ]
Obj. val : -19.44466733740241, Avg. Ret : -18.77759725922947
Iteration [  93  ]
Obj. val : -19.720052703991875, Avg. Ret : -19.239499227795353
Iteration [  94  ]
Obj. val : -19.757019073425464, Avg. Ret : -23.94702135067618
Iteration [  95  ]
Obj. val : -19.39565766863541, Avg. Ret : -18.869646617396896
Iteration [  96  ]
Obj. val : -19.543186935478264, Avg. Ret : -19.087735380411768
Iteration [  97  ]
Obj. val : -19.639807517710967, Avg. Ret : -23.815466179498518
Iteration [  98  ]
Obj. val : -19.415195933590258, Avg. Ret : -18.93002026962471
Iteration [  99  ]
Obj. val : -19.423592652854985, Avg. Ret : -18.758999895934668
checkpoint for objective values, iteration: 100. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_1.csv
checkpoint for avg return values, iteration: 100. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_1.csv
Iteration [  100  ]
Obj. val : -19.687410116524546, Avg. Ret : -23.773089330970066
Iteration [  101  ]
Obj. val : -19.365623875668298, Avg. Ret : -18.9901033001643
Iteration [  102  ]
Obj. val : -19.450085879448707, Avg. Ret : -18.572651432145598
Iteration [  103  ]
Obj. val : -19.154407066777324, Avg. Ret : -23.875032825348896
Iteration [  104  ]
Obj. val : -19.702081205064147, Avg. Ret : -18.931096424178936
Iteration [  105  ]
Obj. val : -19.69223973131581, Avg. Ret : -18.679260920494432
Iteration [  106  ]
Obj. val : -19.716841732532867, Avg. Ret : -23.6670669512844
Iteration [  107  ]
Obj. val : -19.29732343028999, Avg. Ret : -18.875145083930157
Iteration [  108  ]
Obj. val : -19.70925811249053, Avg. Ret : -18.442033056372644
Iteration [  109  ]
Obj. val : -18.997189404709765, Avg. Ret : -23.678264938408383
Iteration [  110  ]
Obj. val : -19.43055519991267, Avg. Ret : -18.47503169075801
Iteration [  111  ]
Obj. val : -19.291103239085164, Avg. Ret : -19.08989847803538
Iteration [  112  ]
Obj. val : -19.24282536143732, Avg. Ret : -23.681006410985745
Iteration [  113  ]
Obj. val : -19.25055993499543, Avg. Ret : -19.17799432737217
Iteration [  114  ]
Obj. val : -18.950778096617192, Avg. Ret : -18.47855030750988
Iteration [  115  ]
Obj. val : -18.491090506172885, Avg. Ret : -23.476967985528344
Iteration [  116  ]
Obj. val : -19.16521612126691, Avg. Ret : -18.94649260990479
Iteration [  117  ]
Obj. val : -18.74374858348891, Avg. Ret : -18.386494141223565
Iteration [  118  ]
Obj. val : -19.118020688185982, Avg. Ret : -23.37662074609753
Iteration [  119  ]
Obj. val : -18.74618694497614, Avg. Ret : -19.26625764074923
Iteration [  120  ]
Obj. val : -18.799106753140805, Avg. Ret : -18.26592467531099
Iteration [  121  ]
Obj. val : -19.2836592817335, Avg. Ret : -23.314569784421646
Iteration [  122  ]
Obj. val : -19.28644896499877, Avg. Ret : -18.564760344134086
Iteration [  123  ]
Obj. val : -19.18741495548642, Avg. Ret : -19.251755863462936
Iteration [  124  ]
Obj. val : -19.135064135916128, Avg. Ret : -21.502277099632227
Iteration [  125  ]
Obj. val : -18.808770171830073, Avg. Ret : -19.02800688093303
Iteration [  126  ]
Obj. val : -18.819198358225705, Avg. Ret : -18.57456699458384
Iteration [  127  ]
Obj. val : -19.408732090621662, Avg. Ret : -23.49664621608497
Iteration [  128  ]
Obj. val : -19.014398887946985, Avg. Ret : -19.07290649694079
Iteration [  129  ]
Obj. val : -19.13642230120643, Avg. Ret : -18.252519885531637
Iteration [  130  ]
Obj. val : -19.15204191794893, Avg. Ret : -23.22701960851512
Iteration [  131  ]
Obj. val : -19.18945244707836, Avg. Ret : -19.006301297916615
Iteration [  132  ]
Obj. val : -18.910253977775177, Avg. Ret : -18.376924616554657
Iteration [  133  ]
Obj. val : -19.239073920216782, Avg. Ret : -23.406109052595333
Iteration [  134  ]
Obj. val : -19.31429777893559, Avg. Ret : -18.397422779150716
Iteration [  135  ]
Obj. val : -18.81156172051689, Avg. Ret : -18.931322477269326
Iteration [  136  ]
Obj. val : -19.81297683338377, Avg. Ret : -23.450377181574417
Iteration [  137  ]
Obj. val : -19.626400010531672, Avg. Ret : -18.39947563138912
Iteration [  138  ]
Obj. val : -19.339673614094576, Avg. Ret : -19.196169034290698
Iteration [  139  ]
Obj. val : -19.854488474950035, Avg. Ret : -23.147204876264112
Iteration [  140  ]
Obj. val : -19.60675150855255, Avg. Ret : -18.29563883895922
Iteration [  141  ]
Obj. val : -20.149951977335572, Avg. Ret : -19.222032962541434
Iteration [  142  ]
Obj. val : -19.899592156034373, Avg. Ret : -23.20405805324249
Iteration [  143  ]
Obj. val : -19.901433203541885, Avg. Ret : -19.54771914688717
Iteration [  144  ]
Obj. val : -20.050400438654425, Avg. Ret : -18.470584268355754
Iteration [  145  ]
Obj. val : -20.110478760481758, Avg. Ret : -22.847069644937104
Iteration [  146  ]
Obj. val : -19.914341921135815, Avg. Ret : -18.078632425070126
Iteration [  147  ]
Obj. val : -20.693795116560878, Avg. Ret : -19.232280975014017
Iteration [  148  ]
Obj. val : -20.4740958192386, Avg. Ret : -23.278682604606164
Iteration [  149  ]
Obj. val : -20.59249591862, Avg. Ret : -18.304385678442305
Iteration [  150  ]
Obj. val : -20.991888707877138, Avg. Ret : -18.7044168670667
Iteration [  151  ]
Obj. val : -20.777031688933228, Avg. Ret : -23.0994140274624
Iteration [  152  ]
Obj. val : -21.01127491060229, Avg. Ret : -18.718619920049957
Iteration [  153  ]
Obj. val : -20.88834936851781, Avg. Ret : -18.4002099660744
Iteration [  154  ]
Obj. val : -21.144631954032647, Avg. Ret : -23.136948037621764
Iteration [  155  ]
Obj. val : -21.097139510932532, Avg. Ret : -18.32746002494753
Iteration [  156  ]
Obj. val : -20.896893011252516, Avg. Ret : -18.906773686072693
Iteration [  157  ]
Obj. val : -21.32864085728231, Avg. Ret : -23.056503842036573
Iteration [  158  ]
Obj. val : -21.404746432367848, Avg. Ret : -19.003066527599437
Iteration [  159  ]
Obj. val : -21.0546560680018, Avg. Ret : -18.049318614099263
Iteration [  160  ]
Obj. val : -21.382104564559338, Avg. Ret : -22.977116915336545
Iteration [  161  ]
Obj. val : -21.742540693010238, Avg. Ret : -18.493872976488827
Iteration [  162  ]
Obj. val : -22.090377969489992, Avg. Ret : -18.48168860182326
Iteration [  163  ]
Obj. val : -21.619518437817227, Avg. Ret : -22.9793936803477
Iteration [  164  ]
Obj. val : -21.770033555948505, Avg. Ret : -18.8495845789701
Iteration [  165  ]
Obj. val : -21.51591123033811, Avg. Ret : -18.29098400520063
Iteration [  166  ]
Obj. val : -22.448290181819043, Avg. Ret : -22.88006390331184
Iteration [  167  ]
Obj. val : -22.61097841391534, Avg. Ret : -18.154355628061186
Iteration [  168  ]
Obj. val : -22.387499711979096, Avg. Ret : -18.563168825047214
Iteration [  169  ]
Obj. val : -22.782602941818965, Avg. Ret : -22.558179972650745
Iteration [  170  ]
Obj. val : -22.889450738432647, Avg. Ret : -18.429606114415513
Iteration [  171  ]
Obj. val : -22.51208013354081, Avg. Ret : -18.32227304527678
Iteration [  172  ]
Obj. val : -22.918588728406807, Avg. Ret : -22.75083739247668
Iteration [  173  ]
Obj. val : -23.078524460111684, Avg. Ret : -18.89929467433324
Iteration [  174  ]
Obj. val : -22.16036738760424, Avg. Ret : -18.371496024663806
Iteration [  175  ]
Obj. val : -23.103783454596904, Avg. Ret : -22.61688808135908
Iteration [  176  ]
Obj. val : -22.93211336961728, Avg. Ret : -19.49792203335786
Iteration [  177  ]
Obj. val : -22.629358204913387, Avg. Ret : -17.839660741658435
Iteration [  178  ]
Obj. val : -23.47310147240644, Avg. Ret : -22.676928395655512
Iteration [  179  ]
Obj. val : -23.345084109281732, Avg. Ret : -18.659679103905884
Iteration [  180  ]
Obj. val : -23.387416560460412, Avg. Ret : -18.429874331412513
Iteration [  181  ]
Obj. val : -23.75612423135732, Avg. Ret : -22.562828504608337
Iteration [  182  ]
Obj. val : -23.231734829257796, Avg. Ret : -17.990566553796985
Iteration [  183  ]
Obj. val : -24.561940910812552, Avg. Ret : -19.2425756124497
Iteration [  184  ]
Obj. val : -24.060660810935403, Avg. Ret : -22.71243596351389
Iteration [  185  ]
Obj. val : -23.00129043974534, Avg. Ret : -18.385459431642502
Iteration [  186  ]
Obj. val : -24.203652994827994, Avg. Ret : -18.505279728525885
Iteration [  187  ]
Obj. val : -23.71056873056795, Avg. Ret : -22.50760051679199
Iteration [  188  ]
Obj. val : -24.279794825311452, Avg. Ret : -18.418749438097624
Iteration [  189  ]
Obj. val : -23.990109608210023, Avg. Ret : -18.4397113701389
Iteration [  190  ]
Obj. val : -24.5053556632077, Avg. Ret : -22.623458044900563
Iteration [  191  ]
Obj. val : -24.442068598113522, Avg. Ret : -18.747490530462272
Iteration [  192  ]
Obj. val : -24.596165153099133, Avg. Ret : -18.040538966221504
Iteration [  193  ]
Obj. val : -24.69445902570053, Avg. Ret : -22.50308051373908
Iteration [  194  ]
Obj. val : -24.34610241785926, Avg. Ret : -18.99922366380082
Iteration [  195  ]
Obj. val : -24.885089715183803, Avg. Ret : -18.381869935444257
Iteration [  196  ]
Obj. val : -24.945749910333223, Avg. Ret : -22.548186484393238
Iteration [  197  ]
Obj. val : -24.65824590522337, Avg. Ret : -18.920537908230585
Iteration [  198  ]
Obj. val : -25.132249954324664, Avg. Ret : -17.711616127416068
Iteration [  199  ]
Obj. val : -24.683177152500235, Avg. Ret : -22.414856875242368
checkpoint for objective values, iteration: 200. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_1.csv
checkpoint for avg return values, iteration: 200. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_1.csv
Iteration [  200  ]
Obj. val : -24.914983065991763, Avg. Ret : -17.734954680004726
Iteration [  201  ]
Obj. val : -25.182491517501425, Avg. Ret : -19.16545940661348
Iteration [  202  ]
Obj. val : -25.263938079920766, Avg. Ret : -22.453206998446355
Iteration [  203  ]
Obj. val : -24.90925458838735, Avg. Ret : -19.321082759542506
Iteration [  204  ]
Obj. val : -25.87021438954349, Avg. Ret : -18.466069611356644
Iteration [  205  ]
Obj. val : -25.22539890712654, Avg. Ret : -22.52432157793079
Iteration [  206  ]
Obj. val : -25.6017211864792, Avg. Ret : -18.23471902685027
Iteration [  207  ]
Obj. val : -25.564609243240007, Avg. Ret : -18.677819139398046
Iteration [  208  ]
Obj. val : -25.27269662937848, Avg. Ret : -22.14944010233991
Iteration [  209  ]
Obj. val : -24.89905732864928, Avg. Ret : -18.045537721244244
Iteration [  210  ]
Obj. val : -25.957089401882943, Avg. Ret : -18.934306284519877
Iteration [  211  ]
Obj. val : -25.776762648261386, Avg. Ret : -22.43657423117647
Iteration [  212  ]
Obj. val : -25.372690467484446, Avg. Ret : -17.991294615538553
Iteration [  213  ]
Obj. val : -26.315747986226235, Avg. Ret : -18.812872334186494
Iteration [  214  ]
Obj. val : -25.85798961094545, Avg. Ret : -22.164690337051688
Iteration [  215  ]
Obj. val : -26.271675687388502, Avg. Ret : -17.926146684822484
Iteration [  216  ]
Obj. val : -26.183276010380155, Avg. Ret : -18.576212409195456
Iteration [  217  ]
Obj. val : -26.200054063117655, Avg. Ret : -22.058350805098467
Iteration [  218  ]
Obj. val : -25.829375792084136, Avg. Ret : -18.098617943525106
Iteration [  219  ]
Obj. val : -26.27020229746529, Avg. Ret : -18.451347811299645
Iteration [  220  ]
Obj. val : -26.61459625173494, Avg. Ret : -22.255012484560954
Iteration [  221  ]
Obj. val : -26.3917674120612, Avg. Ret : -17.976960741409002
Iteration [  222  ]
Obj. val : -26.365697313488024, Avg. Ret : -18.391690460126263
Iteration [  223  ]
Obj. val : -26.890824441650466, Avg. Ret : -22.039996493337018
Iteration [  224  ]
Obj. val : -26.426265613208187, Avg. Ret : -18.150870041725046
Iteration [  225  ]
Obj. val : -26.736153800946344, Avg. Ret : -17.923032484207685
Iteration [  226  ]
Obj. val : -26.907804262206657, Avg. Ret : -22.104631708232983
Iteration [  227  ]
Obj. val : -26.643565276236675, Avg. Ret : -18.321543930810506
Iteration [  228  ]
Obj. val : -26.779164494805517, Avg. Ret : -18.395336094863477
Iteration [  229  ]
Obj. val : -26.427517613790656, Avg. Ret : -22.07967818231184
Iteration [  230  ]
Obj. val : -26.483725558016648, Avg. Ret : -17.65799552859033
Iteration [  231  ]
Obj. val : -26.855387667621297, Avg. Ret : -18.777702984662348
Iteration [  232  ]
Obj. val : -27.254849449890298, Avg. Ret : -22.104192256962378
Iteration [  233  ]
Obj. val : -27.17595931000713, Avg. Ret : -18.43935513672396
Iteration [  234  ]
Obj. val : -27.02321776525652, Avg. Ret : -17.81215342266614
Iteration [  235  ]
Obj. val : -26.999137283280614, Avg. Ret : -21.944752510756175
Iteration [  236  ]
Obj. val : -27.253681627580047, Avg. Ret : -18.04299544698757
Iteration [  237  ]
Obj. val : -27.127327313040777, Avg. Ret : -18.40712684272479
Iteration [  238  ]
Obj. val : -27.30324250619793, Avg. Ret : -21.88807253455299
Iteration [  239  ]
Obj. val : -26.806643098272676, Avg. Ret : -18.385973648063977
Iteration [  240  ]
Obj. val : -27.788785095049963, Avg. Ret : -18.020451846881848
Iteration [  241  ]
Obj. val : -27.422682231942957, Avg. Ret : -21.970644930558286
Iteration [  242  ]
Obj. val : -27.296011065703947, Avg. Ret : -18.34907524443906
Iteration [  243  ]
Obj. val : -27.438601382331598, Avg. Ret : -17.988606800914507
Iteration [  244  ]
Obj. val : -27.585653111834624, Avg. Ret : -22.068579166618637
Iteration [  245  ]
Obj. val : -27.225084639079547, Avg. Ret : -17.99818078360281
Iteration [  246  ]
Obj. val : -27.552077795873508, Avg. Ret : -18.254056048706012
Iteration [  247  ]
Obj. val : -27.550969421148558, Avg. Ret : -21.830616584202506
Iteration [  248  ]
Obj. val : -27.176579778783392, Avg. Ret : -18.489145091685995
Iteration [  249  ]
Obj. val : -27.492110088478825, Avg. Ret : -17.613891676071244
Iteration [  250  ]
Obj. val : -27.519871768384302, Avg. Ret : -21.57945274412558
Iteration [  251  ]
Obj. val : -27.063715172652564, Avg. Ret : -18.418751888005737
Iteration [  252  ]
Obj. val : -27.667287141833555, Avg. Ret : -17.76935770679111
Iteration [  253  ]
Obj. val : -28.17759814857092, Avg. Ret : -19.77869266588505
Iteration [  254  ]
Obj. val : -27.82894809487784, Avg. Ret : -18.94676733589284
Iteration [  255  ]
Obj. val : -27.54554359736155, Avg. Ret : -17.990023826861947
Iteration [  256  ]
Obj. val : -27.938573893543047, Avg. Ret : -21.929909124568102
Iteration [  257  ]
Obj. val : -27.20328214022602, Avg. Ret : -18.438267581173506
Iteration [  258  ]
Obj. val : -27.37701882076164, Avg. Ret : -17.533458396607564
Iteration [  259  ]
Obj. val : -27.895807230893865, Avg. Ret : -21.822606272799867
Iteration [  260  ]
Obj. val : -27.87819318548873, Avg. Ret : -18.104478814902365
Iteration [  261  ]
Obj. val : -28.24688261304594, Avg. Ret : -19.26207922068308
Iteration [  262  ]
Obj. val : -28.29016428612597, Avg. Ret : -21.818681793954696
Iteration [  263  ]
Obj. val : 45.80622820287374, Avg. Ret : -18.24154902189679
Iteration [  264  ]
Obj. val : -28.090467391261342, Avg. Ret : -19.62634006257867
Iteration [  265  ]
Obj. val : -27.923409582123185, Avg. Ret : -21.676923052104982
Iteration [  266  ]
Obj. val : -27.827277401060773, Avg. Ret : -17.810897977956564
Iteration [  267  ]
Obj. val : -27.979445616526775, Avg. Ret : -18.73749208056509
Iteration [  268  ]
Obj. val : -28.262251711711134, Avg. Ret : -21.575148301457112
Iteration [  269  ]
Obj. val : -28.30164455426842, Avg. Ret : -17.81256417081424
Iteration [  270  ]
Obj. val : -28.20729874260096, Avg. Ret : -18.93360202471608
Iteration [  271  ]
Obj. val : -27.9277885084355, Avg. Ret : -19.708294304241782
Iteration [  272  ]
Obj. val : -28.580751339755963, Avg. Ret : -20.396287938038114
Iteration [  273  ]
Obj. val : -28.439899550707487, Avg. Ret : -17.831666434601065
Iteration [  274  ]
Obj. val : -28.53703586753029, Avg. Ret : -21.7269132497594
Iteration [  275  ]
Obj. val : -28.459039821421825, Avg. Ret : -17.922869125909898
Iteration [  276  ]
Obj. val : -28.233297241019407, Avg. Ret : -18.730792776996598
Iteration [  277  ]
Obj. val : -28.545112468192396, Avg. Ret : -21.673497476322837
Iteration [  278  ]
Obj. val : -28.42276089918987, Avg. Ret : -17.718926818704976
Iteration [  279  ]
Obj. val : -28.51635105939343, Avg. Ret : -18.983131983089155
Iteration [  280  ]
Obj. val : -28.881408673632972, Avg. Ret : -21.655558585448425
Iteration [  281  ]
Obj. val : -28.57437815186042, Avg. Ret : -18.205192125301565
Iteration [  282  ]
Obj. val : -28.695971059743236, Avg. Ret : -17.666615686225136
Iteration [  283  ]
Obj. val : -28.890475330213306, Avg. Ret : -21.65295039936616
Iteration [  284  ]
Obj. val : -28.808414133051652, Avg. Ret : -17.711769779607653
Iteration [  285  ]
Obj. val : -29.00207928259123, Avg. Ret : -18.57892449170479
Iteration [  286  ]
Obj. val : -28.47788474953392, Avg. Ret : -21.390087615196872
Iteration [  287  ]
Obj. val : -28.62078716039003, Avg. Ret : -18.0225167996134
Iteration [  288  ]
Obj. val : -28.64853763700494, Avg. Ret : -17.77804377106125
Iteration [  289  ]
Obj. val : -28.749870844046754, Avg. Ret : -21.669222173786203
Iteration [  290  ]
Obj. val : -28.286378685914766, Avg. Ret : -18.28120058038871
Iteration [  291  ]
Obj. val : -29.079642939813745, Avg. Ret : -17.704084771988793
Iteration [  292  ]
Obj. val : -29.546782135947584, Avg. Ret : -21.27508512391819
Iteration [  293  ]
Obj. val : -29.374798220529453, Avg. Ret : -17.81796239867961
Iteration [  294  ]
Obj. val : -29.17512993445967, Avg. Ret : -17.92244345195848
Iteration [  295  ]
Obj. val : -28.979667177077705, Avg. Ret : -21.715223118296553
Iteration [  296  ]
Obj. val : -28.885073973629876, Avg. Ret : -17.84256188427954
Iteration [  297  ]
Obj. val : -29.38086496715935, Avg. Ret : -17.60578728840414
Iteration [  298  ]
Obj. val : -29.337520685998395, Avg. Ret : -21.385850806997674
Iteration [  299  ]
Obj. val : -29.171550589701344, Avg. Ret : -17.850584922879044
checkpoint for objective values, iteration: 300. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_1.csv
checkpoint for avg return values, iteration: 300. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_1.csv
Iteration [  300  ]
Obj. val : -28.90752764661482, Avg. Ret : -17.5984621730988
Iteration [  301  ]
Obj. val : -28.95385878701343, Avg. Ret : -21.497763588956207
Iteration [  302  ]
Obj. val : -29.26089743718711, Avg. Ret : -17.919168319249167
Iteration [  303  ]
Obj. val : -29.414233355817228, Avg. Ret : -19.08219306150734
Iteration [  304  ]
Obj. val : -28.893968821873393, Avg. Ret : -21.352194868642005
Iteration [  305  ]
Obj. val : -29.3515466975045, Avg. Ret : -17.66748195867218
Iteration [  306  ]
Obj. val : -29.371549078177743, Avg. Ret : -18.61068977263799
Iteration [  307  ]
Obj. val : -29.045453728892635, Avg. Ret : -21.289331911833266
Iteration [  308  ]
Obj. val : -29.40057784480622, Avg. Ret : -19.749636404581125
Iteration [  309  ]
Obj. val : -29.18614172843077, Avg. Ret : -18.183799581881225
Iteration [  310  ]
Obj. val : -29.25700737183196, Avg. Ret : -21.376265215998597
Iteration [  311  ]
Obj. val : -29.25287463758187, Avg. Ret : -18.546388573234413
Iteration [  312  ]
Obj. val : -29.29982691634573, Avg. Ret : -20.1557346418396
Iteration [  313  ]
Obj. val : -29.390395848222653, Avg. Ret : -21.088258037274095
Iteration [  314  ]
Obj. val : -29.60788258665634, Avg. Ret : -20.875955892525127
Iteration [  315  ]
Obj. val : -29.11772835868151, Avg. Ret : -18.833660489245396
Iteration [  316  ]
Obj. val : -28.668806726404416, Avg. Ret : -21.131341236609213
Iteration [  317  ]
Obj. val : -29.2401597063566, Avg. Ret : -21.001921904842966
Iteration [  318  ]
Obj. val : -29.126104670178133, Avg. Ret : -19.651885620885192
Iteration [  319  ]
Obj. val : -29.302405469966214, Avg. Ret : -21.11924524974167
Iteration [  320  ]
Obj. val : -29.51877454476255, Avg. Ret : -20.420457728720674
Iteration [  321  ]
Obj. val : -29.565619367657384, Avg. Ret : -18.910671046963074
Iteration [  322  ]
Obj. val : -29.4877289208682, Avg. Ret : -21.12169987682382
Iteration [  323  ]
Obj. val : -29.17169351428332, Avg. Ret : -18.495844944905773
Iteration [  324  ]
Obj. val : -29.42004228405196, Avg. Ret : -20.620967829327927
Iteration [  325  ]
Obj. val : -29.243973823136237, Avg. Ret : -21.163406390065447
Iteration [  326  ]
Obj. val : -29.021368810029227, Avg. Ret : -18.545624659155102
Iteration [  327  ]
Obj. val : -29.396282019870007, Avg. Ret : -19.22252920648611
Iteration [  328  ]
Obj. val : -29.486795967352148, Avg. Ret : -21.18618177459005
Iteration [  329  ]
Obj. val : -29.585954009722553, Avg. Ret : -17.570338073630044
Iteration [  330  ]
Obj. val : -29.495727048016573, Avg. Ret : -19.72640012862035
Iteration [  331  ]
Obj. val : -29.68533485848362, Avg. Ret : -21.13942062143867
Iteration [  332  ]
Obj. val : -29.45234459400441, Avg. Ret : -17.640553250966644
Iteration [  333  ]
Obj. val : -30.12744227072481, Avg. Ret : -17.773469667500443
Iteration [  334  ]
Obj. val : -29.241913067280816, Avg. Ret : -20.85723990915053
Iteration [  335  ]
Obj. val : -29.371446211841516, Avg. Ret : -18.468860384100598
Iteration [  336  ]
Obj. val : -29.614324028773535, Avg. Ret : -17.352388266779098
Iteration [  337  ]
Obj. val : -29.256718591667475, Avg. Ret : -20.982294246432986
Iteration [  338  ]
Obj. val : -29.11955211657891, Avg. Ret : -18.646103991031566
Iteration [  339  ]
Obj. val : -29.741114319356974, Avg. Ret : -19.82540068515842
Iteration [  340  ]
Obj. val : -29.428756349987427, Avg. Ret : -21.030335901636004
Iteration [  341  ]
Obj. val : -29.982333887678845, Avg. Ret : -19.29547603167235
Iteration [  342  ]
Obj. val : -29.676887606534983, Avg. Ret : -18.517604909461394
Iteration [  343  ]
Obj. val : -29.070081491762835, Avg. Ret : -20.971516884833953
Iteration [  344  ]
Obj. val : -29.4783960846858, Avg. Ret : -18.759719333564732
Iteration [  345  ]
Obj. val : -29.521292900549238, Avg. Ret : -17.346202101444717
Iteration [  346  ]
Obj. val : -30.019879373871103, Avg. Ret : -20.919134610078277
Iteration [  347  ]
Obj. val : -29.316871639493165, Avg. Ret : -19.917561263919076
Iteration [  348  ]
Obj. val : -29.82973610770935, Avg. Ret : -18.065477620718806
Iteration [  349  ]
Obj. val : -29.208711029335824, Avg. Ret : -20.96230745232425
Iteration [  350  ]
Obj. val : -29.768850378310848, Avg. Ret : -19.952647375180213
Iteration [  351  ]
Obj. val : -29.645394125667373, Avg. Ret : -18.686502166821366
Iteration [  352  ]
Obj. val : -28.884087607109837, Avg. Ret : -20.89983259250677
Iteration [  353  ]
Obj. val : -29.746342299982555, Avg. Ret : -21.08491984693051
Iteration [  354  ]
Obj. val : -29.29356716868688, Avg. Ret : -18.464386344817452
Iteration [  355  ]
Obj. val : -30.22716546862008, Avg. Ret : -21.086284896623294
Iteration [  356  ]
Obj. val : -29.67527412234036, Avg. Ret : -18.91295256225845
Iteration [  357  ]
Obj. val : -28.808395775561355, Avg. Ret : -17.76412201328694
Iteration [  358  ]
Obj. val : -29.48744430392859, Avg. Ret : -20.89158183189328
Iteration [  359  ]
Obj. val : -29.24300288049342, Avg. Ret : -18.479086413667645
Iteration [  360  ]
Obj. val : -29.387649926392495, Avg. Ret : -17.598782332333045
Iteration [  361  ]
Obj. val : -29.460303463992904, Avg. Ret : -20.835772897122524
Iteration [  362  ]
Obj. val : -29.434153743834965, Avg. Ret : -18.186561906885803
Iteration [  363  ]
Obj. val : -29.426206733003465, Avg. Ret : -17.417342557207586
Iteration [  364  ]
Obj. val : -29.60735296384383, Avg. Ret : -20.976991765229826
Iteration [  365  ]
Obj. val : -29.670566018546328, Avg. Ret : -18.168857002222467
Iteration [  366  ]
Obj. val : -29.442319160459544, Avg. Ret : -19.3489759051052
Iteration [  367  ]
Obj. val : -30.04149308071973, Avg. Ret : -20.598202908827467
Iteration [  368  ]
Obj. val : -28.787333751142697, Avg. Ret : -19.96293192101865
Iteration [  369  ]
Obj. val : -29.517760719752143, Avg. Ret : -17.94975026087769
Iteration [  370  ]
Obj. val : -29.45747373118284, Avg. Ret : -20.75043778217246
Iteration [  371  ]
Obj. val : -29.672883407027552, Avg. Ret : -17.222451761476748
Iteration [  372  ]
Obj. val : -29.305900997147127, Avg. Ret : -18.746277343263195
Iteration [  373  ]
Obj. val : -29.46678064737163, Avg. Ret : -20.696113176616738
Iteration [  374  ]
Obj. val : -29.77362634862011, Avg. Ret : -18.016904810621817
Iteration [  375  ]
Obj. val : -29.443926655835355, Avg. Ret : -17.1845345078368
Iteration [  376  ]
Obj. val : -29.60008955533754, Avg. Ret : -20.611814157138056
Iteration [  377  ]
Obj. val : -29.49645245271213, Avg. Ret : -17.46714899854653
Iteration [  378  ]
Obj. val : -29.383597447934072, Avg. Ret : -18.320222342766034
Iteration [  379  ]
Obj. val : -29.21995488247787, Avg. Ret : -20.7936407273563
Iteration [  380  ]
Obj. val : -29.23275840294178, Avg. Ret : -15.806455779607694
Iteration [  381  ]
Obj. val : -29.383586580620694, Avg. Ret : -17.320213083711163
Iteration [  382  ]
Obj. val : -29.399708562318935, Avg. Ret : -20.834479551307695
Iteration [  383  ]
Obj. val : -29.31847425478025, Avg. Ret : -45.10641608369243
Iteration [  384  ]
Obj. val : -30.03695361495415, Avg. Ret : -46.28230686708477
Iteration [  385  ]
Obj. val : -29.847485647668943, Avg. Ret : -20.566565855127145
Iteration [  386  ]
Obj. val : -29.308624861705944, Avg. Ret : -46.303936460702225
Iteration [  387  ]
Obj. val : -29.26806668475373, Avg. Ret : -27.69508282017934
Iteration [  388  ]
Obj. val : -29.16780924035153, Avg. Ret : -20.63926097743882
Iteration [  389  ]
Obj. val : -29.479434794633644, Avg. Ret : -44.1448522469497
Iteration [  390  ]
Obj. val : -29.50641736701797, Avg. Ret : -44.45449412944721
Iteration [  391  ]
Obj. val : -29.27403519764854, Avg. Ret : -20.64229900295771
Iteration [  392  ]
Obj. val : -29.014439128120586, Avg. Ret : -44.19779932388867
Iteration [  393  ]
Obj. val : -29.407543727300837, Avg. Ret : -44.07006126763723
Iteration [  394  ]
Obj. val : -28.93771486213399, Avg. Ret : -20.488584081172302
Iteration [  395  ]
Obj. val : -29.545579328866626, Avg. Ret : -46.28019533449974
Iteration [  396  ]
Obj. val : -29.358534161223915, Avg. Ret : -40.81561138957822
Iteration [  397  ]
Obj. val : -29.268122504105342, Avg. Ret : -20.45264779544846
Iteration [  398  ]
Obj. val : -29.127111712415704, Avg. Ret : -42.87412860199141
Iteration [  399  ]
Obj. val : -29.326680337188936, Avg. Ret : -41.625431648868265
checkpoint for objective values, iteration: 400. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_1.csv
checkpoint for avg return values, iteration: 400. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_1.csv
Iteration [  400  ]
Obj. val : -28.636260894597797, Avg. Ret : -20.500360456042554
Iteration [  401  ]
Obj. val : -29.49285171216677, Avg. Ret : -46.15503433414173
Iteration [  402  ]
Obj. val : -29.112559627456847, Avg. Ret : -41.33193550169757
Iteration [  403  ]
Obj. val : -28.98057479609278, Avg. Ret : -20.502268738184434
Iteration [  404  ]
Obj. val : -28.885588134051172, Avg. Ret : -43.03687796745149
Iteration [  405  ]
Obj. val : -29.29116788363899, Avg. Ret : -37.53650330283003
Iteration [  406  ]
Obj. val : -29.606158976807546, Avg. Ret : -20.543070330587252
Iteration [  407  ]
Obj. val : -29.45854927264258, Avg. Ret : -37.293856725254656
Iteration [  408  ]
Obj. val : -29.29181601305154, Avg. Ret : -43.2777560342845
Iteration [  409  ]
Obj. val : -28.650583484696828, Avg. Ret : -20.63493100809918
Iteration [  410  ]
Obj. val : -29.393435458916585, Avg. Ret : -33.015707337287246
Iteration [  411  ]
Obj. val : -28.81145625697472, Avg. Ret : -42.018788754961044
Iteration [  412  ]
Obj. val : -28.99614943206345, Avg. Ret : -20.730178045299063
Iteration [  413  ]
Obj. val : -28.907019210420977, Avg. Ret : -39.05642106413517
Iteration [  414  ]
Obj. val : -28.881869134907767, Avg. Ret : -14.616994770310328
Iteration [  415  ]
Obj. val : -28.740960644875113, Avg. Ret : -20.59238136547005
Iteration [  416  ]
Obj. val : -28.993694937205174, Avg. Ret : -41.597467254276445
Iteration [  417  ]
Obj. val : -29.008187711780707, Avg. Ret : -29.476036808588137
Iteration [  418  ]
Obj. val : -28.869790504789226, Avg. Ret : -20.635726353010636
Iteration [  419  ]
Obj. val : -29.11848231318048, Avg. Ret : -9.867116462436686
Iteration [  420  ]
Obj. val : -28.046204505365722, Avg. Ret : -39.29492590128248
Iteration [  421  ]
Obj. val : -28.928721176169816, Avg. Ret : -20.7571573381077
Iteration [  422  ]
Obj. val : -28.472629081939722, Avg. Ret : -13.626314961565377
Iteration [  423  ]
Obj. val : -28.36773996058014, Avg. Ret : -36.12115627204693
Iteration [  424  ]
Obj. val : -28.543048757718996, Avg. Ret : -20.897910085568864
Iteration [  425  ]
Obj. val : -28.300211380236785, Avg. Ret : -16.513092655400907
Iteration [  426  ]
Obj. val : -28.666160884845546, Avg. Ret : -38.57174985301302
Iteration [  427  ]
Obj. val : -28.58406720358012, Avg. Ret : -20.703103453658823
Iteration [  428  ]
Obj. val : -28.11775854020649, Avg. Ret : -28.110867594250127
Iteration [  429  ]
Obj. val : -28.637774912715827, Avg. Ret : -39.427392488068755
Iteration [  430  ]
Obj. val : -28.53773303305794, Avg. Ret : -20.78312730460025
Iteration [  431  ]
Obj. val : -28.654782719560917, Avg. Ret : -38.69632549205343
Iteration [  432  ]
Obj. val : -28.54977305471958, Avg. Ret : -23.04501770583722
Iteration [  433  ]
Obj. val : -28.535248756851434, Avg. Ret : -20.73296571094239
Iteration [  434  ]
Obj. val : -27.91202295884398, Avg. Ret : -39.28256980175206
Iteration [  435  ]
Obj. val : -28.19908994273589, Avg. Ret : -28.83984226657866
Iteration [  436  ]
Obj. val : -28.78263396782838, Avg. Ret : -20.830095656532645
Iteration [  437  ]
Obj. val : -28.19532348825496, Avg. Ret : -29.525487775267237
Iteration [  438  ]
Obj. val : -27.974136007210966, Avg. Ret : -38.77976213322626
Iteration [  439  ]
Obj. val : -28.543871433763556, Avg. Ret : -20.937672259870407
Iteration [  440  ]
Obj. val : -27.973943832995264, Avg. Ret : -39.04988355112277
Iteration [  441  ]
Obj. val : -28.65216849902818, Avg. Ret : -30.20420239210859
Iteration [  442  ]
Obj. val : -27.955042703373664, Avg. Ret : -20.855727876404554
Iteration [  443  ]
Obj. val : -28.129642114079957, Avg. Ret : -30.530773445580895
Iteration [  444  ]
Obj. val : -28.376625365198723, Avg. Ret : -38.607694879956
Iteration [  445  ]
Obj. val : -28.59837927790729, Avg. Ret : -20.988237660606533
Iteration [  446  ]
Obj. val : -27.97234105081455, Avg. Ret : -37.60126317076974
Iteration [  447  ]
Obj. val : -27.970894490141212, Avg. Ret : -30.50195544717139
Iteration [  448  ]
Obj. val : -28.72502624363656, Avg. Ret : -21.18703858719929
Iteration [  449  ]
Obj. val : -28.69595844547131, Avg. Ret : -31.331084790901624
Iteration [  450  ]
Obj. val : -28.620855291828832, Avg. Ret : -37.47896199433347
Iteration [  451  ]
Obj. val : -28.65003821063728, Avg. Ret : -20.989284706226012
Iteration [  452  ]
Obj. val : -27.874370302116454, Avg. Ret : -31.812488075741598
Iteration [  453  ]
Obj. val : -28.301859090567138, Avg. Ret : -37.353156927360594
Iteration [  454  ]
Obj. val : -28.213473610695253, Avg. Ret : -21.141451328880347
Iteration [  455  ]
Obj. val : -28.298647464018895, Avg. Ret : -37.160546716773
Iteration [  456  ]
Obj. val : -27.941669875579922, Avg. Ret : -32.402625742692976
Iteration [  457  ]
Obj. val : -28.68247543444179, Avg. Ret : -21.329615391627758
Iteration [  458  ]
Obj. val : -28.17419064070072, Avg. Ret : -37.98132820999167
Iteration [  459  ]
Obj. val : -28.532743968948072, Avg. Ret : -32.52695889308683
Iteration [  460  ]
Obj. val : -28.468942870124096, Avg. Ret : -21.310485431778606
Iteration [  461  ]
Obj. val : -27.90344191646304, Avg. Ret : -33.1679911238743
Iteration [  462  ]
Obj. val : -27.983924189843588, Avg. Ret : -36.95800419140732
Iteration [  463  ]
Obj. val : -28.241923639833995, Avg. Ret : -21.5197048028766
Iteration [  464  ]
Obj. val : -27.98470793206978, Avg. Ret : -33.37569207780315
Iteration [  465  ]
Obj. val : -28.052350294351363, Avg. Ret : -37.06748274703789
Iteration [  466  ]
Obj. val : -28.622986113282863, Avg. Ret : -21.63233389634864
Iteration [  467  ]
Obj. val : -28.314785812147434, Avg. Ret : -33.70441657607284
Iteration [  468  ]
Obj. val : -27.90300191419586, Avg. Ret : -36.759740960319675
Iteration [  469  ]
Obj. val : -28.268359317050503, Avg. Ret : -21.74882608826951
Iteration [  470  ]
Obj. val : -28.20287144512691, Avg. Ret : -34.17769508767276
Iteration [  471  ]
Obj. val : -28.23933727539515, Avg. Ret : -36.79191913334821
Iteration [  472  ]
Obj. val : -28.089567642242837, Avg. Ret : -21.787897302810787
Iteration [  473  ]
Obj. val : -28.437168577210134, Avg. Ret : -33.92946999333648
Iteration [  474  ]
Obj. val : -28.274876078390037, Avg. Ret : -37.23106276476633
Iteration [  475  ]
Obj. val : -28.344972593475138, Avg. Ret : -21.86251500204452
Iteration [  476  ]
Obj. val : -28.259816363805434, Avg. Ret : -34.13653845054273
Iteration [  477  ]
Obj. val : -28.308026330290613, Avg. Ret : -37.214087223476014
Iteration [  478  ]
Obj. val : -28.351668835263, Avg. Ret : -22.042357992377458
Iteration [  479  ]
Obj. val : -28.18194428953818, Avg. Ret : -34.54597157525652
Iteration [  480  ]
Obj. val : -28.196250973621336, Avg. Ret : -36.5406342356655
Iteration [  481  ]
Obj. val : -28.57494184577724, Avg. Ret : -22.133318767810188
Iteration [  482  ]
Obj. val : -28.314574967143248, Avg. Ret : -36.940389708138184
Iteration [  483  ]
Obj. val : -28.389605718553664, Avg. Ret : -34.52058804915741
Iteration [  484  ]
Obj. val : -28.162833773593565, Avg. Ret : -22.021298819672428
Iteration [  485  ]
Obj. val : -27.84347166995333, Avg. Ret : -36.82935535517133
Iteration [  486  ]
Obj. val : -28.035610633182777, Avg. Ret : -34.58326639852408
Iteration [  487  ]
Obj. val : -28.14318985556963, Avg. Ret : -22.197191092570115
Iteration [  488  ]
Obj. val : -28.607042617778074, Avg. Ret : -34.69049012729194
Iteration [  489  ]
Obj. val : -28.123111199562416, Avg. Ret : -36.931681866627784
Iteration [  490  ]
Obj. val : 43.26393913861534, Avg. Ret : -22.216881455199555
Iteration [  491  ]
Obj. val : -28.072998368937423, Avg. Ret : -36.472914988186055
Iteration [  492  ]
Obj. val : -28.233334941658693, Avg. Ret : -34.924926660447426
Iteration [  493  ]
Obj. val : -27.682005654816447, Avg. Ret : -22.481599379881214
Iteration [  494  ]
Obj. val : -28.065887890448344, Avg. Ret : -36.63203413471924
Iteration [  495  ]
Obj. val : -28.206092322425583, Avg. Ret : -35.1190811196239
Iteration [  496  ]
Obj. val : -28.155694894873932, Avg. Ret : -22.519568072581265
Iteration [  497  ]
Obj. val : -28.233788429065758, Avg. Ret : -35.2744012775308
Iteration [  498  ]
Obj. val : -28.27785100657247, Avg. Ret : -36.38275455968915
Iteration [  499  ]
Obj. val : 42.93186928061486, Avg. Ret : -22.65871111655041
checkpoint for objective values, iteration: 500. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_1.csv
checkpoint for objective values, iteration: 500. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_1.csv
batch = 2
inside iterator
Iteration [  0  ]
Obj. val : -23.587864473803208, Avg. Ret : -24.191198563283937
Iteration [  1  ]
Obj. val : -23.157467430337032, Avg. Ret : -24.14833721757311
Iteration [  2  ]
Obj. val : -23.539489221086978, Avg. Ret : -24.144373106824858
Iteration [  3  ]
Obj. val : -23.11743867353145, Avg. Ret : -24.183964922908245
Iteration [  4  ]
Obj. val : -22.980304122174193, Avg. Ret : -24.00682171145495
Iteration [  5  ]
Obj. val : -23.42231813585963, Avg. Ret : -24.094707467994596
Iteration [  6  ]
Obj. val : -23.05894608468184, Avg. Ret : -23.829223385048273
Iteration [  7  ]
Obj. val : -23.313602189561482, Avg. Ret : -24.19525985653484
Iteration [  8  ]
Obj. val : -22.184003571438218, Avg. Ret : -24.224401925113117
Iteration [  9  ]
Obj. val : -22.533596681710815, Avg. Ret : -24.04398126373414
Iteration [  10  ]
Obj. val : -22.304416771443094, Avg. Ret : -24.35195562834573
Iteration [  11  ]
Obj. val : -23.23239250431601, Avg. Ret : -24.20384536979196
Iteration [  12  ]
Obj. val : -23.352239877882724, Avg. Ret : -23.900990599975053
Iteration [  13  ]
Obj. val : -22.971778483002524, Avg. Ret : -24.06998197083073
Iteration [  14  ]
Obj. val : -22.91780870807708, Avg. Ret : -24.259614716611022
Iteration [  15  ]
Obj. val : -22.87161433079164, Avg. Ret : -24.01239933486896
Iteration [  16  ]
Obj. val : -22.468254804333995, Avg. Ret : -24.366084739862867
Iteration [  17  ]
Obj. val : 54.25825482997869, Avg. Ret : -24.096914861838783
Iteration [  18  ]
Obj. val : -23.18321156419509, Avg. Ret : -24.25545967817512
Iteration [  19  ]
Obj. val : -23.307344916683938, Avg. Ret : -24.16559329898223
Iteration [  20  ]
Obj. val : -22.735116496517197, Avg. Ret : -44.51288227617001
Iteration [  21  ]
Obj. val : -22.677379064326242, Avg. Ret : -36.92803477316463
Iteration [  22  ]
Obj. val : -22.55579352746258, Avg. Ret : -32.03866669864492
Iteration [  23  ]
Obj. val : -22.67098535885784, Avg. Ret : -28.38714532094956
Iteration [  24  ]
Obj. val : -22.480094141886838, Avg. Ret : -17.69429688321321
Iteration [  25  ]
Obj. val : -22.85161321441129, Avg. Ret : -30.879963528141147
Iteration [  26  ]
Obj. val : -22.81985522914444, Avg. Ret : -20.129683760856338
Iteration [  27  ]
Obj. val : -22.23572640448906, Avg. Ret : -29.32184275307322
Iteration [  28  ]
Obj. val : -22.79145042539991, Avg. Ret : -20.758331047060043
Iteration [  29  ]
Obj. val : -22.650396251240803, Avg. Ret : -28.404035403674992
Iteration [  30  ]
Obj. val : -22.48419371739619, Avg. Ret : -27.867696145951005
Iteration [  31  ]
Obj. val : -21.88335458152601, Avg. Ret : -21.043236643175593
Iteration [  32  ]
Obj. val : -22.450418530733426, Avg. Ret : -21.916243968613863
Iteration [  33  ]
Obj. val : -22.17304052312362, Avg. Ret : -26.75431422452428
Iteration [  34  ]
Obj. val : -22.28045800146677, Avg. Ret : -21.853748637307163
Iteration [  35  ]
Obj. val : -22.352413414554373, Avg. Ret : -27.031418436801335
Iteration [  36  ]
Obj. val : -22.309476728190926, Avg. Ret : -26.340324960517222
Iteration [  37  ]
Obj. val : -22.028744957402015, Avg. Ret : -22.336850633906735
Iteration [  38  ]
Obj. val : -22.368949372426446, Avg. Ret : -23.883797617625973
Iteration [  39  ]
Obj. val : -22.479502308051707, Avg. Ret : -22.395840485159994
Iteration [  40  ]
Obj. val : -21.891453498621896, Avg. Ret : -24.892169832391783
Iteration [  41  ]
Obj. val : -22.411708156814875, Avg. Ret : -24.76274954967536
Iteration [  42  ]
Obj. val : -22.384934716439634, Avg. Ret : -23.67467757270147
Iteration [  43  ]
Obj. val : -21.824959210875807, Avg. Ret : -24.66614836786719
Iteration [  44  ]
Obj. val : -21.962843597448956, Avg. Ret : -23.87523788271268
Iteration [  45  ]
Obj. val : -21.929775423203814, Avg. Ret : -24.770529122526586
Iteration [  46  ]
Obj. val : -21.939385273494175, Avg. Ret : -24.759082594856267
Iteration [  47  ]
Obj. val : -21.888762397259732, Avg. Ret : -23.91260113633138
Iteration [  48  ]
Obj. val : -22.037669268983375, Avg. Ret : -24.77891889181337
Iteration [  49  ]
Obj. val : -21.988227468777147, Avg. Ret : -24.785938639740845
Iteration [  50  ]
Obj. val : 53.54863009742081, Avg. Ret : -24.830665813158358
Iteration [  51  ]
Obj. val : -22.309034986325603, Avg. Ret : -24.32695543291966
Iteration [  52  ]
Obj. val : -22.236172072197963, Avg. Ret : -24.828553345671818
Iteration [  53  ]
Obj. val : -21.522417904299907, Avg. Ret : -21.82803365736404
Iteration [  54  ]
Obj. val : -21.34772202809019, Avg. Ret : -24.81591895209708
Iteration [  55  ]
Obj. val : -21.533300033704887, Avg. Ret : -24.599291532373126
Iteration [  56  ]
Obj. val : -22.018233003695574, Avg. Ret : -22.557194916088225
Iteration [  57  ]
Obj. val : -22.227308210832195, Avg. Ret : -24.531233245002618
Iteration [  58  ]
Obj. val : -21.99178759073653, Avg. Ret : -24.780598477286254
Iteration [  59  ]
Obj. val : -21.605046173308203, Avg. Ret : -23.943919790843076
Iteration [  60  ]
Obj. val : -22.348733428113945, Avg. Ret : -22.600068653882335
Iteration [  61  ]
Obj. val : -21.92397795616662, Avg. Ret : -24.85262932805962
Iteration [  62  ]
Obj. val : -21.96194188081914, Avg. Ret : -22.469445168847496
Iteration [  63  ]
Obj. val : -22.95165861182345, Avg. Ret : -23.616496992144075
Iteration [  64  ]
Obj. val : -22.000936699399105, Avg. Ret : -24.70039112913884
Iteration [  65  ]
Obj. val : -22.005630671704502, Avg. Ret : -22.418096463522424
Iteration [  66  ]
Obj. val : -22.27255235021001, Avg. Ret : -23.344445185764066
Iteration [  67  ]
Obj. val : -22.66600562179989, Avg. Ret : -24.648830954930357
Iteration [  68  ]
Obj. val : -22.41009507649573, Avg. Ret : -22.24510341016763
Iteration [  69  ]
Obj. val : -22.482527199555474, Avg. Ret : -22.845700492648806
Iteration [  70  ]
Obj. val : -22.180341170474808, Avg. Ret : -24.614535441389776
Iteration [  71  ]
Obj. val : -22.43250460012041, Avg. Ret : -22.12159719072295
Iteration [  72  ]
Obj. val : -21.808753052072223, Avg. Ret : -22.908363714610445
Iteration [  73  ]
Obj. val : -22.79226931785295, Avg. Ret : -24.638121174197874
Iteration [  74  ]
Obj. val : -22.132603383306094, Avg. Ret : -22.08202110378123
Iteration [  75  ]
Obj. val : -23.25852159884712, Avg. Ret : -22.67434832827963
Iteration [  76  ]
Obj. val : -22.60644785658651, Avg. Ret : -24.761641550866734
Iteration [  77  ]
Obj. val : -22.8083149665613, Avg. Ret : -21.86515300620376
Iteration [  78  ]
Obj. val : -22.97830420947775, Avg. Ret : -22.588647196218094
Iteration [  79  ]
Obj. val : -23.219731868519375, Avg. Ret : -24.823222565021737
Iteration [  80  ]
Obj. val : -22.672254776703227, Avg. Ret : -21.995219618610694
Iteration [  81  ]
Obj. val : -23.007752040667786, Avg. Ret : -22.52538544249195
Iteration [  82  ]
Obj. val : -22.674786355957874, Avg. Ret : -24.575354717578374
Iteration [  83  ]
Obj. val : -23.643892287679655, Avg. Ret : -22.059193795226598
Iteration [  84  ]
Obj. val : -23.227201512952163, Avg. Ret : -22.11862574022103
Iteration [  85  ]
Obj. val : -23.28288437407891, Avg. Ret : -24.505353346629427
Iteration [  86  ]
Obj. val : -23.495676412030146, Avg. Ret : -22.09032190243438
Iteration [  87  ]
Obj. val : -23.553130752192562, Avg. Ret : -21.820529503754038
Iteration [  88  ]
Obj. val : -23.794007588305522, Avg. Ret : -24.160772571390716
Iteration [  89  ]
Obj. val : -23.709500298119035, Avg. Ret : -21.765503656765972
Iteration [  90  ]
Obj. val : -23.5683975082264, Avg. Ret : -22.06527224677819
Iteration [  91  ]
Obj. val : -24.03725919942247, Avg. Ret : -22.49718295348686
Iteration [  92  ]
Obj. val : -23.62897787116122, Avg. Ret : -21.736587943755918
Iteration [  93  ]
Obj. val : -23.67987409051199, Avg. Ret : -22.240186388227634
Iteration [  94  ]
Obj. val : -23.952424431387982, Avg. Ret : -24.53088142655921
Iteration [  95  ]
Obj. val : -23.875004990055583, Avg. Ret : -21.618469506693838
Iteration [  96  ]
Obj. val : -24.25895314727816, Avg. Ret : -21.97557774581594
Iteration [  97  ]
Obj. val : -24.515428944650132, Avg. Ret : -24.43070409118825
Iteration [  98  ]
Obj. val : -24.536285576487902, Avg. Ret : -21.504317484878506
Iteration [  99  ]
Obj. val : -24.21028930968972, Avg. Ret : -21.69462078584075
checkpoint for objective values, iteration: 100. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_2.csv
checkpoint for avg return values, iteration: 100. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_2.csv
Iteration [  100  ]
Obj. val : -24.43529853537046, Avg. Ret : -24.38591992053114
Iteration [  101  ]
Obj. val : -24.56361231861465, Avg. Ret : -21.460670451515615
Iteration [  102  ]
Obj. val : -25.3201098484198, Avg. Ret : -21.410123078731417
Iteration [  103  ]
Obj. val : 50.3913565745203, Avg. Ret : -24.234679895854548
Iteration [  104  ]
Obj. val : -24.943795778120265, Avg. Ret : -21.516368306855224
Iteration [  105  ]
Obj. val : -24.957607134820798, Avg. Ret : -21.165529539326073
Iteration [  106  ]
Obj. val : -23.90957074607926, Avg. Ret : -24.19790446719552
Iteration [  107  ]
Obj. val : -25.17979460228584, Avg. Ret : -21.24281035721179
Iteration [  108  ]
Obj. val : -25.528930466639135, Avg. Ret : -21.364934200154153
Iteration [  109  ]
Obj. val : -25.425200526765448, Avg. Ret : -24.370050181107302
Iteration [  110  ]
Obj. val : -25.046247021392176, Avg. Ret : -21.324181389423153
Iteration [  111  ]
Obj. val : -25.46546314984284, Avg. Ret : -21.23507316821763
Iteration [  112  ]
Obj. val : -25.154044212378565, Avg. Ret : -24.433723796430453
Iteration [  113  ]
Obj. val : -25.085170540053973, Avg. Ret : -21.176769533279106
Iteration [  114  ]
Obj. val : -25.104868274367774, Avg. Ret : -21.410634760095927
Iteration [  115  ]
Obj. val : -25.1841526035026, Avg. Ret : -24.40789568566715
Iteration [  116  ]
Obj. val : 49.52207634670746, Avg. Ret : -21.255707090131
Iteration [  117  ]
Obj. val : -25.670037056084535, Avg. Ret : -21.248254471485293
Iteration [  118  ]
Obj. val : -25.302295965619226, Avg. Ret : -24.17259082733269
Iteration [  119  ]
Obj. val : -25.505618871129684, Avg. Ret : -21.14381275609732
Iteration [  120  ]
Obj. val : -25.22418791516159, Avg. Ret : -21.181186138090013
Iteration [  121  ]
Obj. val : -25.72383437184594, Avg. Ret : -24.128491542289662
Iteration [  122  ]
Obj. val : -25.274075630827987, Avg. Ret : -21.079790167445804
Iteration [  123  ]
Obj. val : -25.60700819001476, Avg. Ret : -20.938189026248423
Iteration [  124  ]
Obj. val : -25.52850753306948, Avg. Ret : -24.45256812401483
Iteration [  125  ]
Obj. val : -25.16854326349486, Avg. Ret : -20.92680780483883
Iteration [  126  ]
Obj. val : -25.366338857077793, Avg. Ret : -20.883715534642953
Iteration [  127  ]
Obj. val : 47.81919073133303, Avg. Ret : -24.200273043377123
Iteration [  128  ]
Obj. val : -25.08859025578958, Avg. Ret : -20.867005742273673
Iteration [  129  ]
Obj. val : -25.79283310813583, Avg. Ret : -20.90499963052274
Iteration [  130  ]
Obj. val : -25.959303720106544, Avg. Ret : -24.105810704201545
Iteration [  131  ]
Obj. val : -25.830537978496576, Avg. Ret : -21.13603815114429
Iteration [  132  ]
Obj. val : -25.531358741084517, Avg. Ret : -21.13091087451559
Iteration [  133  ]
Obj. val : -25.68964731378654, Avg. Ret : -23.943551426015503
Iteration [  134  ]
Obj. val : -25.490170974629876, Avg. Ret : -21.072272982527124
Iteration [  135  ]
Obj. val : -25.7344457394009, Avg. Ret : -20.9048896254772
Iteration [  136  ]
Obj. val : -25.60749897096218, Avg. Ret : -24.22513120456186
Iteration [  137  ]
Obj. val : -25.964534118870983, Avg. Ret : -21.08453398606295
Iteration [  138  ]
Obj. val : -24.887604030152527, Avg. Ret : -20.86612029396214
Iteration [  139  ]
Obj. val : -25.74752511491077, Avg. Ret : -23.99100724197272
Iteration [  140  ]
Obj. val : -25.524249442254934, Avg. Ret : -20.992790185735092
Iteration [  141  ]
Obj. val : -25.040780262685896, Avg. Ret : -21.167700086066688
Iteration [  142  ]
Obj. val : -25.629446488930196, Avg. Ret : -23.950101864978116
Iteration [  143  ]
Obj. val : -25.65698721828878, Avg. Ret : -20.945261597572983
Iteration [  144  ]
Obj. val : -25.81546981447333, Avg. Ret : -21.05872143253391
Iteration [  145  ]
Obj. val : -25.746729907163047, Avg. Ret : -23.811150649189667
Iteration [  146  ]
Obj. val : -25.35333861863048, Avg. Ret : -20.67356270758051
Iteration [  147  ]
Obj. val : -26.19408069902573, Avg. Ret : -20.851680178109074
Iteration [  148  ]
Obj. val : -25.612061155922273, Avg. Ret : -23.834266504874723
Iteration [  149  ]
Obj. val : -25.56924898390572, Avg. Ret : -20.786587472118548
Iteration [  150  ]
Obj. val : -26.20351654778673, Avg. Ret : -20.946845041648377
Iteration [  151  ]
Obj. val : -25.83936162274535, Avg. Ret : -24.042765568299938
Iteration [  152  ]
Obj. val : -25.427140107886906, Avg. Ret : -20.878199419032615
Iteration [  153  ]
Obj. val : -25.4303006587095, Avg. Ret : -20.625673538847078
Iteration [  154  ]
Obj. val : -25.51363055339841, Avg. Ret : -23.786410430244526
Iteration [  155  ]
Obj. val : -26.07843093642012, Avg. Ret : -20.90235946821964
Iteration [  156  ]
Obj. val : -25.7259995071481, Avg. Ret : -21.01551877418024
Iteration [  157  ]
Obj. val : -26.147132572095074, Avg. Ret : -23.994276068762
Iteration [  158  ]
Obj. val : -26.134447824489015, Avg. Ret : -20.776214083629593
Iteration [  159  ]
Obj. val : -26.069067313026544, Avg. Ret : -20.88060345114814
Iteration [  160  ]
Obj. val : -25.3883528778019, Avg. Ret : -23.840745057740577
Iteration [  161  ]
Obj. val : -25.708693945662176, Avg. Ret : -20.506718700818123
Iteration [  162  ]
Obj. val : -25.91153130705266, Avg. Ret : -20.730767487256188
Iteration [  163  ]
Obj. val : -25.91817452731248, Avg. Ret : -23.99737926696303
Iteration [  164  ]
Obj. val : -26.28364923446057, Avg. Ret : -20.791401493590453
Iteration [  165  ]
Obj. val : -26.082943678392166, Avg. Ret : -20.625048506297077
Iteration [  166  ]
Obj. val : -25.80466546128192, Avg. Ret : -23.824213212495252
Iteration [  167  ]
Obj. val : -26.31564198448028, Avg. Ret : -20.758070132040917
Iteration [  168  ]
Obj. val : -25.700739165176884, Avg. Ret : -20.46470469786665
Iteration [  169  ]
Obj. val : -26.330092339240526, Avg. Ret : -23.73629719456018
Iteration [  170  ]
Obj. val : -26.099804155564783, Avg. Ret : -20.51807020987059
Iteration [  171  ]
Obj. val : -25.755312223536208, Avg. Ret : -20.709636928698224
Iteration [  172  ]
Obj. val : -26.104853439587917, Avg. Ret : -23.72613769452588
Iteration [  173  ]
Obj. val : -26.051852113157352, Avg. Ret : -20.567980066064468
Iteration [  174  ]
Obj. val : -26.353258636576246, Avg. Ret : -20.772317059089215
Iteration [  175  ]
Obj. val : -26.293265969854286, Avg. Ret : -23.7880152685233
Iteration [  176  ]
Obj. val : -26.221260354815566, Avg. Ret : -20.389453960780692
Iteration [  177  ]
Obj. val : -26.556962218334636, Avg. Ret : -20.48584507683555
Iteration [  178  ]
Obj. val : -26.527558964083813, Avg. Ret : -23.80274683310809
Iteration [  179  ]
Obj. val : -26.142967836070408, Avg. Ret : -20.36057063456238
Iteration [  180  ]
Obj. val : -26.582493221127528, Avg. Ret : -20.75812741286275
Iteration [  181  ]
Obj. val : -26.611638876661196, Avg. Ret : -23.766813717228114
Iteration [  182  ]
Obj. val : -26.456931131511453, Avg. Ret : -20.528951081592144
Iteration [  183  ]
Obj. val : -26.381715968076605, Avg. Ret : -20.76543944643733
Iteration [  184  ]
Obj. val : -26.722924151149876, Avg. Ret : -23.69640142413111
Iteration [  185  ]
Obj. val : -26.67460714264436, Avg. Ret : -18.446274537550448
Iteration [  186  ]
Obj. val : -26.513612430342654, Avg. Ret : -20.44399620856811
Iteration [  187  ]
Obj. val : -27.063903856548645, Avg. Ret : -23.687539375842615
Iteration [  188  ]
Obj. val : -26.554214467103932, Avg. Ret : -20.473245748215483
Iteration [  189  ]
Obj. val : -26.879119199992907, Avg. Ret : -22.108462752188938
Iteration [  190  ]
Obj. val : -27.440823356211563, Avg. Ret : -21.494380841851445
Iteration [  191  ]
Obj. val : -27.310856896738144, Avg. Ret : -22.1813200471932
Iteration [  192  ]
Obj. val : -27.239702498410647, Avg. Ret : -23.915428600182665
Iteration [  193  ]
Obj. val : -27.224421547983933, Avg. Ret : -23.669745573718384
Iteration [  194  ]
Obj. val : -26.899076817486073, Avg. Ret : -24.840794000405296
Iteration [  195  ]
Obj. val : 45.60261064801638, Avg. Ret : -23.153375874237927
Iteration [  196  ]
Obj. val : -26.536754127536298, Avg. Ret : -23.734895215618927
Iteration [  197  ]
Obj. val : -27.06272647073846, Avg. Ret : -25.48295707926503
Iteration [  198  ]
Obj. val : -27.355656654990792, Avg. Ret : -23.089445701956098
Iteration [  199  ]
Obj. val : -27.18392398588904, Avg. Ret : -23.551012720485595
checkpoint for objective values, iteration: 200. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_2.csv
checkpoint for avg return values, iteration: 200. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_2.csv
Iteration [  200  ]
Obj. val : -27.838209512035935, Avg. Ret : -26.230543802330523
Iteration [  201  ]
Obj. val : -27.33559779201604, Avg. Ret : -24.045254505048867
Iteration [  202  ]
Obj. val : -26.74258915098565, Avg. Ret : -23.7093340625994
Iteration [  203  ]
Obj. val : -27.605869861202766, Avg. Ret : -26.50226061640961
Iteration [  204  ]
Obj. val : -27.52058359122627, Avg. Ret : -24.24086330608286
Iteration [  205  ]
Obj. val : 45.03812002804844, Avg. Ret : -23.487901668797647
Iteration [  206  ]
Obj. val : -27.563300330694403, Avg. Ret : -25.019735970634034
Iteration [  207  ]
Obj. val : 45.1842490350497, Avg. Ret : -24.70305713782633
Iteration [  208  ]
Obj. val : -27.023313737252945, Avg. Ret : -23.765222300924105
Iteration [  209  ]
Obj. val : 43.842206528759775, Avg. Ret : -25.534160927339773
Iteration [  210  ]
Obj. val : -27.95710033228643, Avg. Ret : -27.292553787299106
Iteration [  211  ]
Obj. val : -28.167826850372116, Avg. Ret : -23.86305898861077
Iteration [  212  ]
Obj. val : -27.255940918422425, Avg. Ret : -26.274494076467292
Iteration [  213  ]
Obj. val : -27.415840834545744, Avg. Ret : -27.084234016402807
Iteration [  214  ]
Obj. val : -28.027817918692875, Avg. Ret : -23.660519320500516
Iteration [  215  ]
Obj. val : -27.452672601581593, Avg. Ret : -27.573496972396565
Iteration [  216  ]
Obj. val : 44.60507472499977, Avg. Ret : -26.76476720555435
Iteration [  217  ]
Obj. val : -28.1390682323269, Avg. Ret : -23.689258499110856
Iteration [  218  ]
Obj. val : -28.444284412804958, Avg. Ret : -26.818677822598456
Iteration [  219  ]
Obj. val : -28.189836801163132, Avg. Ret : -27.800251502113404
Iteration [  220  ]
Obj. val : -28.143134882485196, Avg. Ret : -23.701366198999267
Iteration [  221  ]
Obj. val : 47.355360174107865, Avg. Ret : -28.076470241375524
Iteration [  222  ]
Obj. val : -28.135199070893176, Avg. Ret : -26.929017811497467
Iteration [  223  ]
Obj. val : -28.2941362938687, Avg. Ret : -23.603479499766223
Iteration [  224  ]
Obj. val : -28.456326617627926, Avg. Ret : -27.99571182416068
Iteration [  225  ]
Obj. val : -28.316958460366987, Avg. Ret : -27.487837161564418
Iteration [  226  ]
Obj. val : -28.447728521637558, Avg. Ret : -23.977087867551287
Iteration [  227  ]
Obj. val : -28.676633310003037, Avg. Ret : -27.759816913859655
Iteration [  228  ]
Obj. val : -28.546109944969206, Avg. Ret : -28.518022051436947
Iteration [  229  ]
Obj. val : -28.641048447535997, Avg. Ret : -24.133599451290376
Iteration [  230  ]
Obj. val : -28.727182547484055, Avg. Ret : -28.6618973899251
Iteration [  231  ]
Obj. val : -28.694210043174714, Avg. Ret : -28.40399152966575
Iteration [  232  ]
Obj. val : -27.964317158912355, Avg. Ret : -23.683417222415116
Iteration [  233  ]
Obj. val : -28.63832067816938, Avg. Ret : -29.021357502106554
Iteration [  234  ]
Obj. val : -29.033395180911736, Avg. Ret : -28.306185814789373
Iteration [  235  ]
Obj. val : -29.398980588544553, Avg. Ret : -23.848764314780283
Iteration [  236  ]
Obj. val : -29.24075081380358, Avg. Ret : -28.93563305679838
Iteration [  237  ]
Obj. val : -29.322386463842097, Avg. Ret : -28.534412897122614
Iteration [  238  ]
Obj. val : -29.13114595930234, Avg. Ret : -23.840989735326275
Iteration [  239  ]
Obj. val : -28.889514864873387, Avg. Ret : -28.571377501618954
Iteration [  240  ]
Obj. val : -28.84005236273137, Avg. Ret : -29.19253784117963
Iteration [  241  ]
Obj. val : 43.94334418208182, Avg. Ret : -24.094092497100288
Iteration [  242  ]
Obj. val : -29.354335860830496, Avg. Ret : -29.357988326839095
Iteration [  243  ]
Obj. val : -29.59967430156887, Avg. Ret : -28.754903596688592
Iteration [  244  ]
Obj. val : -30.058346658139328, Avg. Ret : -23.954469061551258
Iteration [  245  ]
Obj. val : -30.20270361833753, Avg. Ret : -29.313708715893952
Iteration [  246  ]
Obj. val : -29.1175295651278, Avg. Ret : -29.05906914896366
Iteration [  247  ]
Obj. val : -29.956981586239323, Avg. Ret : -23.94887764771553
Iteration [  248  ]
Obj. val : 48.455346104270866, Avg. Ret : -29.213972075997727
Iteration [  249  ]
Obj. val : -30.5124556548131, Avg. Ret : -29.404447247808758
Iteration [  250  ]
Obj. val : -29.999990693217214, Avg. Ret : -24.17597532492735
Iteration [  251  ]
Obj. val : -29.72317271475863, Avg. Ret : -29.2601468097651
Iteration [  252  ]
Obj. val : -30.303109039077388, Avg. Ret : -29.740510427108717
Iteration [  253  ]
Obj. val : -30.48153384409245, Avg. Ret : -23.938839919494463
Iteration [  254  ]
Obj. val : -29.93579267129759, Avg. Ret : -29.733383783257047
Iteration [  255  ]
Obj. val : 48.52302092117522, Avg. Ret : -29.41446946416264
Iteration [  256  ]
Obj. val : -30.266024664868155, Avg. Ret : -24.18067248043537
Iteration [  257  ]
Obj. val : -30.52739960639446, Avg. Ret : -29.642073617591354
Iteration [  258  ]
Obj. val : -29.64046336922802, Avg. Ret : -27.948853511624748
Iteration [  259  ]
Obj. val : 42.79405802080744, Avg. Ret : -24.47191755587632
Iteration [  260  ]
Obj. val : -30.246446586309705, Avg. Ret : -29.742295869537024
Iteration [  261  ]
Obj. val : -30.3485006921331, Avg. Ret : -30.367046610287183
Iteration [  262  ]
Obj. val : -30.524994210850217, Avg. Ret : -24.48361247615995
Iteration [  263  ]
Obj. val : -30.62760185782355, Avg. Ret : -30.901963440953203
Iteration [  264  ]
Obj. val : -31.294152773244903, Avg. Ret : -29.85528070142787
Iteration [  265  ]
Obj. val : -30.661454327904362, Avg. Ret : -24.61368341383112
Iteration [  266  ]
Obj. val : -30.623747778536515, Avg. Ret : -30.256973183061508
Iteration [  267  ]
Obj. val : -31.071680091834477, Avg. Ret : -30.938963806438537
Iteration [  268  ]
Obj. val : -31.556210931570337, Avg. Ret : -24.343649234609526
Iteration [  269  ]
Obj. val : -31.225867648904078, Avg. Ret : -30.924844586664527
Iteration [  270  ]
Obj. val : -31.121236312865122, Avg. Ret : -30.6103648215092
Iteration [  271  ]
Obj. val : -31.6927809061418, Avg. Ret : -24.351813950801308
Iteration [  272  ]
Obj. val : -31.199142852714456, Avg. Ret : -31.20537895082677
Iteration [  273  ]
Obj. val : -31.994028038531507, Avg. Ret : -30.568257752146206
Iteration [  274  ]
Obj. val : 44.81416854521149, Avg. Ret : -24.646200674097017
Iteration [  275  ]
Obj. val : -31.491021034387778, Avg. Ret : -30.749694807388423
Iteration [  276  ]
Obj. val : -31.882182515822443, Avg. Ret : -31.122062373409616
Iteration [  277  ]
Obj. val : -32.01403669713217, Avg. Ret : -24.720471614004378
Iteration [  278  ]
Obj. val : -32.0469124563395, Avg. Ret : -31.111932384661763
Iteration [  279  ]
Obj. val : 40.515965218583844, Avg. Ret : -31.418623660469148
Iteration [  280  ]
Obj. val : -31.928379758274502, Avg. Ret : -24.59420147463889
Iteration [  281  ]
Obj. val : -31.293954449540433, Avg. Ret : -31.573561370445645
Iteration [  282  ]
Obj. val : -31.715152962701467, Avg. Ret : -31.005525512839785
Iteration [  283  ]
Obj. val : -32.129717485688104, Avg. Ret : -24.687866795726823
Iteration [  284  ]
Obj. val : -31.63581000479884, Avg. Ret : -31.602122195101824
Iteration [  285  ]
Obj. val : -31.836651238612333, Avg. Ret : -31.07422000264497
Iteration [  286  ]
Obj. val : -31.44176631490031, Avg. Ret : -24.875498618324073
Iteration [  287  ]
Obj. val : -32.19113467675729, Avg. Ret : -31.599045693028085
Iteration [  288  ]
Obj. val : -31.890047812091694, Avg. Ret : -31.392216407159093
Iteration [  289  ]
Obj. val : -32.036133249206195, Avg. Ret : -24.798192256064926
Iteration [  290  ]
Obj. val : -32.72790456870856, Avg. Ret : -29.647530007655046
Iteration [  291  ]
Obj. val : -32.35938029924198, Avg. Ret : -31.47526628897866
Iteration [  292  ]
Obj. val : -32.49370691655501, Avg. Ret : -24.83032616569361
Iteration [  293  ]
Obj. val : 43.41417887573996, Avg. Ret : -32.382200095291566
Iteration [  294  ]
Obj. val : -32.32037243593707, Avg. Ret : -31.855850449418696
Iteration [  295  ]
Obj. val : 43.11937705026098, Avg. Ret : -25.104660002897262
Iteration [  296  ]
Obj. val : -31.867879012648377, Avg. Ret : -32.349518502336004
Iteration [  297  ]
Obj. val : 48.00461533924675, Avg. Ret : -31.744326812773647
Iteration [  298  ]
Obj. val : -32.761445095834674, Avg. Ret : -25.010602424542824
Iteration [  299  ]
Obj. val : 42.977928350853425, Avg. Ret : -32.473623008491444
checkpoint for objective values, iteration: 300. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_2.csv
checkpoint for avg return values, iteration: 300. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_2.csv
Iteration [  300  ]
Obj. val : 42.77593294499452, Avg. Ret : -32.058810673912916
Iteration [  301  ]
Obj. val : -33.12128558407013, Avg. Ret : -25.253266983579543
Iteration [  302  ]
Obj. val : -32.481905654934785, Avg. Ret : -32.45368001670851
Iteration [  303  ]
Obj. val : -32.63841203902801, Avg. Ret : -32.75791335696767
Iteration [  304  ]
Obj. val : -33.20736677286702, Avg. Ret : -25.2316089798512
Iteration [  305  ]
Obj. val : -33.19587867986244, Avg. Ret : -32.34329519101036
Iteration [  306  ]
Obj. val : -32.73428286409447, Avg. Ret : -32.99010164454654
Iteration [  307  ]
Obj. val : -32.82877454306935, Avg. Ret : -25.390623916197928
Iteration [  308  ]
Obj. val : -32.79965850488192, Avg. Ret : -33.00155667769916
Iteration [  309  ]
Obj. val : -33.058486389957835, Avg. Ret : -32.513856916303254
Iteration [  310  ]
Obj. val : 46.10325259940738, Avg. Ret : -25.5012494227663
Iteration [  311  ]
Obj. val : -33.3072445094564, Avg. Ret : -33.20722043162782
Iteration [  312  ]
Obj. val : -33.04422744980094, Avg. Ret : -32.50075327092868
Iteration [  313  ]
Obj. val : -33.10612958591023, Avg. Ret : -25.599154742153306
Iteration [  314  ]
Obj. val : -33.51034121791694, Avg. Ret : -32.97784192144332
Iteration [  315  ]
Obj. val : -33.54114023829509, Avg. Ret : -33.122229064804536
Iteration [  316  ]
Obj. val : -33.47903154471521, Avg. Ret : -25.426129134960597
Iteration [  317  ]
Obj. val : -33.599926556448324, Avg. Ret : -33.2392075069885
Iteration [  318  ]
Obj. val : -33.54091507893371, Avg. Ret : -32.780672119940874
Iteration [  319  ]
Obj. val : -34.04650930047617, Avg. Ret : -25.428339974630052
Iteration [  320  ]
Obj. val : -33.621989526463395, Avg. Ret : -33.34702277155089
Iteration [  321  ]
Obj. val : -33.6499658367108, Avg. Ret : -33.10341225753984
Iteration [  322  ]
Obj. val : -33.24412553652339, Avg. Ret : -25.68947250297103
Iteration [  323  ]
Obj. val : -32.87744547265185, Avg. Ret : -33.42436060417675
Iteration [  324  ]
Obj. val : -33.80716302390367, Avg. Ret : -33.226211433056456
Iteration [  325  ]
Obj. val : -33.41009431563868, Avg. Ret : -25.63367180972583
Iteration [  326  ]
Obj. val : -33.83616966915038, Avg. Ret : -33.44210840706835
Iteration [  327  ]
Obj. val : 39.212017467528696, Avg. Ret : -33.32625702943901
Iteration [  328  ]
Obj. val : 43.90461768857056, Avg. Ret : -25.867340819027735
Iteration [  329  ]
Obj. val : -33.93642754396002, Avg. Ret : -33.31266294009445
Iteration [  330  ]
Obj. val : 43.656033869239096, Avg. Ret : -33.70607603977798
Iteration [  331  ]
Obj. val : 43.72666623066465, Avg. Ret : -25.962116219291698
Iteration [  332  ]
Obj. val : -34.38443421726979, Avg. Ret : -33.360619705987475
Iteration [  333  ]
Obj. val : -34.44995225804612, Avg. Ret : -33.628064275026965
Iteration [  334  ]
Obj. val : -34.63589031891212, Avg. Ret : -26.055706090108853
Iteration [  335  ]
Obj. val : -34.05009148254564, Avg. Ret : -31.27701656800592
Iteration [  336  ]
Obj. val : 43.953350763950716, Avg. Ret : -33.61828287365426
Iteration [  337  ]
Obj. val : -34.756122880359555, Avg. Ret : -26.12206279542299
Iteration [  338  ]
Obj. val : -33.32854241467766, Avg. Ret : -33.262846314083184
Iteration [  339  ]
Obj. val : -34.87104789402575, Avg. Ret : -33.31615417766282
Iteration [  340  ]
Obj. val : -34.60843749777812, Avg. Ret : -26.18126566715364
Iteration [  341  ]
Obj. val : -34.780209945448505, Avg. Ret : -32.79959685270699
Iteration [  342  ]
Obj. val : 43.82819929928651, Avg. Ret : -33.30176798377224
Iteration [  343  ]
Obj. val : -34.85089543837026, Avg. Ret : -26.286974439093257
Iteration [  344  ]
Obj. val : -34.44613598979277, Avg. Ret : -32.86919177883373
Iteration [  345  ]
Obj. val : 41.48835458030918, Avg. Ret : -33.1331473242864
Iteration [  346  ]
Obj. val : -35.53033508905838, Avg. Ret : -26.57915376543021
Iteration [  347  ]
Obj. val : -34.37306785056525, Avg. Ret : -33.3130795530912
Iteration [  348  ]
Obj. val : -34.68295677556617, Avg. Ret : -32.992725245039544
Iteration [  349  ]
Obj. val : -35.14376747358652, Avg. Ret : -24.286126905173493
Iteration [  350  ]
Obj. val : 54.78037698853991, Avg. Ret : -33.08544978980135
Iteration [  351  ]
Obj. val : -34.55433118300977, Avg. Ret : -32.735855530334064
Iteration [  352  ]
Obj. val : -34.61516652514968, Avg. Ret : -26.57880001003163
Iteration [  353  ]
Obj. val : 38.96953671425966, Avg. Ret : -32.57210314934282
Iteration [  354  ]
Obj. val : 39.11338207219809, Avg. Ret : -33.21833874819699
Iteration [  355  ]
Obj. val : -34.683553346657014, Avg. Ret : -26.537832696054632
Iteration [  356  ]
Obj. val : -35.86128027957765, Avg. Ret : -33.05180126996253
Iteration [  357  ]
Obj. val : 43.59051796911062, Avg. Ret : -32.672366832839614
Iteration [  358  ]
Obj. val : 41.33382101451192, Avg. Ret : -26.394812592039376
Iteration [  359  ]
Obj. val : -35.12690835011666, Avg. Ret : -30.162913422704246
Iteration [  360  ]
Obj. val : -34.59202627902912, Avg. Ret : -33.0027942778117
Iteration [  361  ]
Obj. val : -35.944059662510114, Avg. Ret : -26.697882103605853
Iteration [  362  ]
Obj. val : 36.1429155935183, Avg. Ret : -32.24555513007555
Iteration [  363  ]
Obj. val : 56.64593445162469, Avg. Ret : -32.48975627018568
Iteration [  364  ]
Obj. val : -35.416198404801705, Avg. Ret : -26.74793007493383
Iteration [  365  ]
Obj. val : -36.04162904735814, Avg. Ret : -32.573459962232874
Iteration [  366  ]
Obj. val : -34.91850291543243, Avg. Ret : -32.15236322962707
Iteration [  367  ]
Obj. val : 38.49429695681933, Avg. Ret : -27.028737195407384
Iteration [  368  ]
Obj. val : -36.1156321055882, Avg. Ret : -32.157346625874496
Iteration [  369  ]
Obj. val : -35.97740788262281, Avg. Ret : -32.480085812935535
Iteration [  370  ]
Obj. val : -36.06429393598812, Avg. Ret : -26.634934238280735
Iteration [  371  ]
Obj. val : 59.88969485831821, Avg. Ret : -30.029466842382018
Iteration [  372  ]
Obj. val : -35.595561579564844, Avg. Ret : -32.40112498332115
Iteration [  373  ]
Obj. val : -36.17674324039589, Avg. Ret : -26.910633412345923
Iteration [  374  ]
Obj. val : 44.41641564451172, Avg. Ret : -31.38299737854277
Iteration [  375  ]
Obj. val : 43.10572042674856, Avg. Ret : -31.969805033094026
Iteration [  376  ]
Obj. val : -36.7877985698805, Avg. Ret : -27.10436903038867
Iteration [  377  ]
Obj. val : -35.55450175514269, Avg. Ret : -31.692946205812277
Iteration [  378  ]
Obj. val : 38.72857202065873, Avg. Ret : -31.65590635370066
Iteration [  379  ]
Obj. val : -36.77712906405351, Avg. Ret : -26.82904000804074
Iteration [  380  ]
Obj. val : -35.08671955497261, Avg. Ret : -31.707985544598536
Iteration [  381  ]
Obj. val : -36.305988279907986, Avg. Ret : -31.223578147958506
Iteration [  382  ]
Obj. val : -35.69248942582117, Avg. Ret : -26.801002877596307
Iteration [  383  ]
Obj. val : -36.74467318730131, Avg. Ret : -29.40079096235655
Iteration [  384  ]
Obj. val : -36.7085265741104, Avg. Ret : -31.59518909113906
Iteration [  385  ]
Obj. val : 38.491136389038516, Avg. Ret : -27.08210599432027
Iteration [  386  ]
Obj. val : -35.60366658699433, Avg. Ret : -30.801754138697806
Iteration [  387  ]
Obj. val : 36.8492361575602, Avg. Ret : -31.195840670275402
Iteration [  388  ]
Obj. val : -36.80614285488526, Avg. Ret : -24.950982370543716
Iteration [  389  ]
Obj. val : 43.95201588520739, Avg. Ret : -31.19502661711375
Iteration [  390  ]
Obj. val : -36.308491628236794, Avg. Ret : -30.438829276727496
Iteration [  391  ]
Obj. val : 41.92788985219653, Avg. Ret : -27.09131604768991
Iteration [  392  ]
Obj. val : -35.50544851561305, Avg. Ret : -31.013973961147126
Iteration [  393  ]
Obj. val : -36.6528936441518, Avg. Ret : -30.52436004640487
Iteration [  394  ]
Obj. val : -36.92959667893909, Avg. Ret : -27.294676031014657
Iteration [  395  ]
Obj. val : -37.57732090312422, Avg. Ret : -30.41900685487388
Iteration [  396  ]
Obj. val : 37.30822228184455, Avg. Ret : -31.01062440175503
Iteration [  397  ]
Obj. val : -37.343077829787326, Avg. Ret : -27.09698507006071
Iteration [  398  ]
Obj. val : -36.81028359801575, Avg. Ret : -30.51459936405101
Iteration [  399  ]
Obj. val : -36.931209778622225, Avg. Ret : -30.448072222987275
checkpoint for objective values, iteration: 400. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_2.csv
checkpoint for avg return values, iteration: 400. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_2.csv
Iteration [  400  ]
Obj. val : -37.16196224784537, Avg. Ret : -27.232747593306502
Iteration [  401  ]
Obj. val : -36.94493022270809, Avg. Ret : -30.218344252025627
Iteration [  402  ]
Obj. val : -37.56502114980034, Avg. Ret : -30.424403823566344
Iteration [  403  ]
Obj. val : 37.12692537799168, Avg. Ret : -27.15944331087727
Iteration [  404  ]
Obj. val : 36.7668395746851, Avg. Ret : -30.584467066970795
Iteration [  405  ]
Obj. val : -37.15600555984962, Avg. Ret : -30.051360408211465
Iteration [  406  ]
Obj. val : -36.73677781204437, Avg. Ret : -27.234227380988337
Iteration [  407  ]
Obj. val : 39.89681190437263, Avg. Ret : -29.951943445471215
Iteration [  408  ]
Obj. val : -37.76029808690013, Avg. Ret : -30.21607831168421
Iteration [  409  ]
Obj. val : -36.64498040407346, Avg. Ret : -27.037152898489335
Iteration [  410  ]
Obj. val : -36.66262681389556, Avg. Ret : -29.950223136889395
Iteration [  411  ]
Obj. val : -37.43718429322719, Avg. Ret : -30.074108374550242
Iteration [  412  ]
Obj. val : -36.234445388825534, Avg. Ret : -27.157636312388878
Iteration [  413  ]
Obj. val : -37.11069404735106, Avg. Ret : -30.139491213489052
Iteration [  414  ]
Obj. val : -36.69654734200497, Avg. Ret : -29.779577196131807
Iteration [  415  ]
Obj. val : 45.256261183664535, Avg. Ret : -27.521329598820866
Iteration [  416  ]
Obj. val : -37.653463872065714, Avg. Ret : -29.852967918417274
Iteration [  417  ]
Obj. val : -37.201959859247694, Avg. Ret : -29.958667050797168
Iteration [  418  ]
Obj. val : -37.03224191883103, Avg. Ret : -27.137577588675576
Iteration [  419  ]
Obj. val : -38.3833034676358, Avg. Ret : -29.628999614985705
Iteration [  420  ]
Obj. val : -37.58503980878245, Avg. Ret : -29.898724163556775
Iteration [  421  ]
Obj. val : -37.95304828578859, Avg. Ret : -25.408042166608787
Iteration [  422  ]
Obj. val : -38.6182187752423, Avg. Ret : -29.749469391333587
Iteration [  423  ]
Obj. val : -37.46834954835908, Avg. Ret : -29.65097784020496
Iteration [  424  ]
Obj. val : -38.866087579983045, Avg. Ret : -27.213391537490587
Iteration [  425  ]
Obj. val : -37.89238806372303, Avg. Ret : -29.45148429057428
Iteration [  426  ]
Obj. val : -36.396013325302235, Avg. Ret : -29.793556729249925
Iteration [  427  ]
Obj. val : 45.10692976427278, Avg. Ret : -27.435728229711447
Iteration [  428  ]
Obj. val : 56.722610655649696, Avg. Ret : -29.719594808442007
Iteration [  429  ]
Obj. val : 42.74236407040263, Avg. Ret : -29.45566088225437
Iteration [  430  ]
Obj. val : 50.90862386534764, Avg. Ret : -27.247354186087186
Iteration [  431  ]
Obj. val : -38.00768242005884, Avg. Ret : -29.511516017578334
Iteration [  432  ]
Obj. val : -37.385033566917606, Avg. Ret : -29.713409964095064
Iteration [  433  ]
Obj. val : -38.084775931729226, Avg. Ret : -27.290240489268452
Iteration [  434  ]
Obj. val : -37.34905478278058, Avg. Ret : -29.439608816797836
Iteration [  435  ]
Obj. val : -37.49853250556459, Avg. Ret : -29.309732353168965
Iteration [  436  ]
Obj. val : -38.47004110632938, Avg. Ret : -27.66876139386634
Iteration [  437  ]
Obj. val : -37.084945898904564, Avg. Ret : -29.502878341987376
Iteration [  438  ]
Obj. val : -38.19488062296294, Avg. Ret : -29.31598677090225
Iteration [  439  ]
Obj. val : -37.15895053504321, Avg. Ret : -27.42926592630121
Iteration [  440  ]
Obj. val : 36.04492187948678, Avg. Ret : -29.329162846694036
Iteration [  441  ]
Obj. val : 37.63089981814823, Avg. Ret : -29.46992180069435
Iteration [  442  ]
Obj. val : 44.03413183372963, Avg. Ret : -27.475724781039474
Iteration [  443  ]
Obj. val : 35.43138846134474, Avg. Ret : -29.21655978374762
Iteration [  444  ]
Obj. val : -36.46204270801472, Avg. Ret : -29.494915443258396
Iteration [  445  ]
Obj. val : -37.420218281081915, Avg. Ret : -27.33848599027699
Iteration [  446  ]
Obj. val : -36.2834559219388, Avg. Ret : -29.183693421590295
Iteration [  447  ]
Obj. val : 37.330919707652754, Avg. Ret : -29.271188240553624
Iteration [  448  ]
Obj. val : -38.367725470655834, Avg. Ret : -27.3257241444471
Iteration [  449  ]
Obj. val : -38.19116660825838, Avg. Ret : -29.22565747826872
Iteration [  450  ]
Obj. val : -38.49486313931489, Avg. Ret : -29.427510952091648
Iteration [  451  ]
Obj. val : -38.54567045096772, Avg. Ret : -27.49641959410581
Iteration [  452  ]
Obj. val : -38.74330882972611, Avg. Ret : -29.151746790513872
Iteration [  453  ]
Obj. val : -37.37270424167704, Avg. Ret : -29.261512156945592
Iteration [  454  ]
Obj. val : 34.3358284400154, Avg. Ret : -27.233261070745655
Iteration [  455  ]
Obj. val : 45.06483367756255, Avg. Ret : -29.052645547749677
Iteration [  456  ]
Obj. val : -38.48673406237573, Avg. Ret : -29.368528315893784
Iteration [  457  ]
Obj. val : -38.59468842744025, Avg. Ret : -27.391676521898408
Iteration [  458  ]
Obj. val : -39.051497855328, Avg. Ret : -29.340938506507026
Iteration [  459  ]
Obj. val : -38.06116537129863, Avg. Ret : -29.099570942841833
Iteration [  460  ]
Obj. val : 34.57610988805705, Avg. Ret : -27.4574373931889
Iteration [  461  ]
Obj. val : 39.921695175481304, Avg. Ret : -29.106677570332568
Iteration [  462  ]
Obj. val : 35.07756228979272, Avg. Ret : -29.327294702841687
Iteration [  463  ]
Obj. val : 38.149609262237995, Avg. Ret : -27.58744342354588
Iteration [  464  ]
Obj. val : 39.23896638563837, Avg. Ret : -29.00703825158718
Iteration [  465  ]
Obj. val : -38.142309851644306, Avg. Ret : -29.510867974883446
Iteration [  466  ]
Obj. val : 37.138771066953176, Avg. Ret : -27.586528257699296
Iteration [  467  ]
Obj. val : -39.17432347020135, Avg. Ret : -29.15677001731004
Iteration [  468  ]
Obj. val : 62.71608100279642, Avg. Ret : -29.12351862090824
Iteration [  469  ]
Obj. val : -38.769421475320584, Avg. Ret : -27.353136481866485
Iteration [  470  ]
Obj. val : 39.52867622135701, Avg. Ret : -29.002786113153704
Iteration [  471  ]
Obj. val : 37.40745161738265, Avg. Ret : -29.196570112435037
Iteration [  472  ]
Obj. val : -38.55644270309243, Avg. Ret : -27.669143958710183
Iteration [  473  ]
Obj. val : 49.64632553951685, Avg. Ret : -28.893324010858237
Iteration [  474  ]
Obj. val : 39.19154415368055, Avg. Ret : -28.951628682847858
Iteration [  475  ]
Obj. val : 40.22006804064064, Avg. Ret : -27.334036618200965
Iteration [  476  ]
Obj. val : -38.30256322393593, Avg. Ret : -28.868675336527975
Iteration [  477  ]
Obj. val : -39.29973503435807, Avg. Ret : -28.896074048364003
Iteration [  478  ]
Obj. val : -37.66846787855664, Avg. Ret : -27.220870721363003
Iteration [  479  ]
Obj. val : -39.017530002186724, Avg. Ret : -28.85731139048335
Iteration [  480  ]
Obj. val : -38.145526112079004, Avg. Ret : -29.160485117188795
Iteration [  481  ]
Obj. val : 36.7040051337351, Avg. Ret : -27.606792166222753
Iteration [  482  ]
Obj. val : -37.23521683236569, Avg. Ret : -29.23230450003565
Iteration [  483  ]
Obj. val : -39.10702857907418, Avg. Ret : -29.300903519746363
Iteration [  484  ]
Obj. val : -37.562023529943566, Avg. Ret : -27.5215458525146
Iteration [  485  ]
Obj. val : 36.24685173214455, Avg. Ret : -28.970322153886524
Iteration [  486  ]
Obj. val : -38.84570234594709, Avg. Ret : -28.968682719666177
Iteration [  487  ]
Obj. val : -37.76874297977213, Avg. Ret : -27.308984059627672
Iteration [  488  ]
Obj. val : 41.593373033624765, Avg. Ret : -28.889689894497355
Iteration [  489  ]
Obj. val : -39.97941032261762, Avg. Ret : -28.925841040016167
Iteration [  490  ]
Obj. val : -36.540376953926966, Avg. Ret : -27.6117343351888
Iteration [  491  ]
Obj. val : 38.902831791867904, Avg. Ret : -28.84303050726807
Iteration [  492  ]
Obj. val : -36.2604633923838, Avg. Ret : -28.93135887368425
Iteration [  493  ]
Obj. val : -37.960055394637564, Avg. Ret : -27.401350058454632
Iteration [  494  ]
Obj. val : 33.69425639332352, Avg. Ret : -29.070237071114025
Iteration [  495  ]
Obj. val : -37.83722443288189, Avg. Ret : -28.89244982416799
Iteration [  496  ]
Obj. val : 58.980121160544854, Avg. Ret : -27.346123995959097
Iteration [  497  ]
Obj. val : 34.87732278403567, Avg. Ret : -29.042004155909268
Iteration [  498  ]
Obj. val : -39.099391857259285, Avg. Ret : -28.94640996827776
Iteration [  499  ]
Obj. val : -38.61782535376723, Avg. Ret : -27.41691172619624
checkpoint for objective values, iteration: 500. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_2.csv
checkpoint for objective values, iteration: 500. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_2.csv
batch = 3
inside iterator
Iteration [  0  ]
Obj. val : -23.363064000109997, Avg. Ret : -18.186321925506164
Iteration [  1  ]
Obj. val : -22.99709201891626, Avg. Ret : -18.221396089485214
Iteration [  2  ]
Obj. val : -23.25943239804585, Avg. Ret : -18.152055028399182
Iteration [  3  ]
Obj. val : -22.661598315541166, Avg. Ret : -18.127499397587407
Iteration [  4  ]
Obj. val : -22.584551322370856, Avg. Ret : -18.322691430737834
Iteration [  5  ]
Obj. val : -22.823751312399157, Avg. Ret : -18.29828205802528
Iteration [  6  ]
Obj. val : -22.28686641487743, Avg. Ret : -18.311213814523843
Iteration [  7  ]
Obj. val : -22.448195305871042, Avg. Ret : -18.052815729501347
Iteration [  8  ]
Obj. val : -22.951046861504366, Avg. Ret : -18.097014960684547
Iteration [  9  ]
Obj. val : -22.292835874535147, Avg. Ret : -18.085898003358103
Iteration [  10  ]
Obj. val : -22.553877072639946, Avg. Ret : -18.280880925551692
Iteration [  11  ]
Obj. val : -22.119130011763534, Avg. Ret : -18.273853998294037
Iteration [  12  ]
Obj. val : -22.095171037264137, Avg. Ret : -18.089872846229742
Iteration [  13  ]
Obj. val : -22.661144808818168, Avg. Ret : -18.274089842716503
Iteration [  14  ]
Obj. val : -22.398619909503005, Avg. Ret : -18.11562665358357
Iteration [  15  ]
Obj. val : -22.709412466004355, Avg. Ret : -18.198524503863315
Iteration [  16  ]
Obj. val : -22.336576468775313, Avg. Ret : -18.21099513720063
Iteration [  17  ]
Obj. val : -22.30711926959074, Avg. Ret : -18.223507848728772
Iteration [  18  ]
Obj. val : -21.763442203165017, Avg. Ret : -18.395483071532325
Iteration [  19  ]
Obj. val : -21.11934116639715, Avg. Ret : -18.544750829296213
Iteration [  20  ]
Obj. val : -21.595737807361854, Avg. Ret : -34.86664455933908
Iteration [  21  ]
Obj. val : -22.05591465142337, Avg. Ret : -45.18250426307966
Iteration [  22  ]
Obj. val : -21.621080065329704, Avg. Ret : -17.137961811551442
Iteration [  23  ]
Obj. val : -21.945601608432085, Avg. Ret : -30.11091194683787
Iteration [  24  ]
Obj. val : -21.451797919042967, Avg. Ret : -25.39976786130004
Iteration [  25  ]
Obj. val : -20.878539235483323, Avg. Ret : -18.772664317194245
Iteration [  26  ]
Obj. val : -21.280006471234113, Avg. Ret : -23.694434469027073
Iteration [  27  ]
Obj. val : -21.32418834556898, Avg. Ret : -16.690984856334673
Iteration [  28  ]
Obj. val : -21.414013049791198, Avg. Ret : -15.916252920372445
Iteration [  29  ]
Obj. val : -21.35891682072652, Avg. Ret : -22.521496281130776
Iteration [  30  ]
Obj. val : -21.782952863606994, Avg. Ret : -21.88241262026801
Iteration [  31  ]
Obj. val : -20.970621013502644, Avg. Ret : -15.758780666544887
Iteration [  32  ]
Obj. val : -21.199456245328726, Avg. Ret : -15.972181963631783
Iteration [  33  ]
Obj. val : -21.219645416499134, Avg. Ret : -21.5211089813593
Iteration [  34  ]
Obj. val : -21.1846302222288, Avg. Ret : -16.245634506258078
Iteration [  35  ]
Obj. val : -21.05367582341188, Avg. Ret : -21.203994497164995
Iteration [  36  ]
Obj. val : -20.987335335500934, Avg. Ret : -20.765852100004736
Iteration [  37  ]
Obj. val : -20.329192064250893, Avg. Ret : -16.50380384057261
Iteration [  38  ]
Obj. val : -21.31309827432013, Avg. Ret : -20.447983616037
Iteration [  39  ]
Obj. val : 54.509985251739245, Avg. Ret : -16.620861033395496
Iteration [  40  ]
Obj. val : -20.493043718465486, Avg. Ret : -24.85842230270691
Iteration [  41  ]
Obj. val : 53.90843568259387, Avg. Ret : -18.813254985585107
Iteration [  42  ]
Obj. val : -20.701015226997335, Avg. Ret : -17.38020861835889
Iteration [  43  ]
Obj. val : -20.65181474380947, Avg. Ret : -24.724374081559553
Iteration [  44  ]
Obj. val : -20.858523916757207, Avg. Ret : -18.815007592072305
Iteration [  45  ]
Obj. val : -20.62619575766675, Avg. Ret : -17.04699697085073
Iteration [  46  ]
Obj. val : -20.832823755977273, Avg. Ret : -24.571475675601434
Iteration [  47  ]
Obj. val : -20.743216778144248, Avg. Ret : -18.51802099726974
Iteration [  48  ]
Obj. val : -20.295191941721725, Avg. Ret : -17.13603679961977
Iteration [  49  ]
Obj. val : -20.800299807575772, Avg. Ret : -24.41652926191781
Iteration [  50  ]
Obj. val : -20.050215779532866, Avg. Ret : -17.304389011874576
Iteration [  51  ]
Obj. val : -20.568231962098707, Avg. Ret : -18.32292399872448
Iteration [  52  ]
Obj. val : -20.387454715762544, Avg. Ret : -24.526517003971186
Iteration [  53  ]
Obj. val : -20.198404851593565, Avg. Ret : -18.368406616607164
Iteration [  54  ]
Obj. val : -20.49715374054272, Avg. Ret : -17.268761217737488
Iteration [  55  ]
Obj. val : -19.644956718149086, Avg. Ret : -24.25805461923167
Iteration [  56  ]
Obj. val : -20.371877680988685, Avg. Ret : -17.944615236012613
Iteration [  57  ]
Obj. val : -19.91813030920514, Avg. Ret : -17.23435097334525
Iteration [  58  ]
Obj. val : -19.949883076399676, Avg. Ret : -24.467602402310817
Iteration [  59  ]
Obj. val : -19.116406274456004, Avg. Ret : -17.130516032816463
Iteration [  60  ]
Obj. val : -19.530623339681895, Avg. Ret : -17.956395518523912
Iteration [  61  ]
Obj. val : -19.98907483432455, Avg. Ret : -24.415846930254876
Iteration [  62  ]
Obj. val : -19.90015093458287, Avg. Ret : -17.85438488452334
Iteration [  63  ]
Obj. val : -19.896468584377242, Avg. Ret : -17.22141168840659
Iteration [  64  ]
Obj. val : -20.236071068028398, Avg. Ret : -24.35738796110708
Iteration [  65  ]
Obj. val : -19.59087688015695, Avg. Ret : -17.616411319872054
Iteration [  66  ]
Obj. val : -20.186046208475158, Avg. Ret : -17.22627815356527
Iteration [  67  ]
Obj. val : -19.735749841983377, Avg. Ret : -24.274916267903983
Iteration [  68  ]
Obj. val : -19.310210179319416, Avg. Ret : -17.05643865476067
Iteration [  69  ]
Obj. val : -19.477311543665756, Avg. Ret : -17.890816340099615
Iteration [  70  ]
Obj. val : -19.245289160810504, Avg. Ret : -24.173387696773144
Iteration [  71  ]
Obj. val : -19.426755957732645, Avg. Ret : -17.725404317852878
Iteration [  72  ]
Obj. val : -19.365545544897223, Avg. Ret : -17.31655658762731
Iteration [  73  ]
Obj. val : -19.981138392082112, Avg. Ret : -24.192916200517065
Iteration [  74  ]
Obj. val : 51.97635656757949, Avg. Ret : -17.637519937291387
Iteration [  75  ]
Obj. val : -19.29619914011383, Avg. Ret : -17.079756964705137
Iteration [  76  ]
Obj. val : -19.256021858330275, Avg. Ret : -24.184311589533504
Iteration [  77  ]
Obj. val : -19.458576585841932, Avg. Ret : -16.944663979409977
Iteration [  78  ]
Obj. val : -18.795498144723638, Avg. Ret : -17.446593484626856
Iteration [  79  ]
Obj. val : -19.410342807657017, Avg. Ret : -24.047367715119535
Iteration [  80  ]
Obj. val : -18.824696600480387, Avg. Ret : -17.3753404721224
Iteration [  81  ]
Obj. val : -19.253143088581446, Avg. Ret : -17.00909905704014
Iteration [  82  ]
Obj. val : -18.9702852281573, Avg. Ret : -23.874509948682483
Iteration [  83  ]
Obj. val : -18.842287247733786, Avg. Ret : -17.104975065216035
Iteration [  84  ]
Obj. val : -19.027758644092803, Avg. Ret : -17.55457892014105
Iteration [  85  ]
Obj. val : -18.778464946062297, Avg. Ret : -24.0737255565263
Iteration [  86  ]
Obj. val : -19.081281551984247, Avg. Ret : -16.95400943025744
Iteration [  87  ]
Obj. val : -19.194219113382548, Avg. Ret : -17.226037008954915
Iteration [  88  ]
Obj. val : -19.209455696600322, Avg. Ret : -23.754104282178186
Iteration [  89  ]
Obj. val : -18.638593221866937, Avg. Ret : -17.322319391659242
Iteration [  90  ]
Obj. val : -18.65893486881163, Avg. Ret : -16.90963147496519
Iteration [  91  ]
Obj. val : -18.85462513161404, Avg. Ret : -23.71365618596643
Iteration [  92  ]
Obj. val : -18.75093994736305, Avg. Ret : -17.118000855694866
Iteration [  93  ]
Obj. val : -18.921732586667428, Avg. Ret : -17.3288138531238
Iteration [  94  ]
Obj. val : -18.536524012602335, Avg. Ret : -23.527301785527712
Iteration [  95  ]
Obj. val : -18.474290229087238, Avg. Ret : -17.48326687505666
Iteration [  96  ]
Obj. val : -18.31650590442732, Avg. Ret : -16.893998280989376
Iteration [  97  ]
Obj. val : -17.899345003043685, Avg. Ret : -23.568805042253967
Iteration [  98  ]
Obj. val : -18.787717829817527, Avg. Ret : -16.595256874400413
Iteration [  99  ]
Obj. val : -18.090334592887753, Avg. Ret : -17.452098268169426
checkpoint for objective values, iteration: 100. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_3.csv
checkpoint for avg return values, iteration: 100. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_3.csv
Iteration [  100  ]
Obj. val : -18.456046524439266, Avg. Ret : -23.5244183124201
Iteration [  101  ]
Obj. val : -17.80908860446643, Avg. Ret : -17.579390000592838
Iteration [  102  ]
Obj. val : -18.45973300980912, Avg. Ret : -16.71419598952174
Iteration [  103  ]
Obj. val : -18.288727070967756, Avg. Ret : -23.46013822161037
Iteration [  104  ]
Obj. val : -17.848316396821517, Avg. Ret : -16.616903781035973
Iteration [  105  ]
Obj. val : -18.496361527900966, Avg. Ret : -17.5782643023784
Iteration [  106  ]
Obj. val : -18.573005522011144, Avg. Ret : -23.462893835700616
Iteration [  107  ]
Obj. val : -18.262641375005284, Avg. Ret : -16.73049316956514
Iteration [  108  ]
Obj. val : -18.003581058054387, Avg. Ret : -17.492977423648725
Iteration [  109  ]
Obj. val : -18.18296446141599, Avg. Ret : -23.464002826242265
Iteration [  110  ]
Obj. val : -18.00423798885411, Avg. Ret : -16.30075583534797
Iteration [  111  ]
Obj. val : -17.63873877821348, Avg. Ret : -17.542591312927353
Iteration [  112  ]
Obj. val : -17.774397433760594, Avg. Ret : -23.196129987265763
Iteration [  113  ]
Obj. val : -18.145512127357872, Avg. Ret : -16.200664193274086
Iteration [  114  ]
Obj. val : -18.18555598855569, Avg. Ret : -17.906980730174936
Iteration [  115  ]
Obj. val : -17.7724538556584, Avg. Ret : -23.130161157031196
Iteration [  116  ]
Obj. val : -17.70301559519555, Avg. Ret : -17.86902359452945
Iteration [  117  ]
Obj. val : -18.090440057555274, Avg. Ret : -16.25766481697476
Iteration [  118  ]
Obj. val : -17.80204843958585, Avg. Ret : -23.110666381647352
Iteration [  119  ]
Obj. val : -17.85983343886709, Avg. Ret : -16.458284869161517
Iteration [  120  ]
Obj. val : -17.89998716889036, Avg. Ret : -17.458329358125958
Iteration [  121  ]
Obj. val : -17.349418950307665, Avg. Ret : -23.076951776965803
Iteration [  122  ]
Obj. val : -17.770927766516962, Avg. Ret : -16.012284115558646
Iteration [  123  ]
Obj. val : -17.80517288098679, Avg. Ret : -17.587253758036447
Iteration [  124  ]
Obj. val : -17.9855267862851, Avg. Ret : -23.042003429329853
Iteration [  125  ]
Obj. val : -18.017354148636834, Avg. Ret : -17.512645276706937
Iteration [  126  ]
Obj. val : -17.653921663812476, Avg. Ret : -16.250879838910933
Iteration [  127  ]
Obj. val : -17.473598190761404, Avg. Ret : -22.925731423338203
Iteration [  128  ]
Obj. val : -17.225459980660343, Avg. Ret : -16.457012588833308
Iteration [  129  ]
Obj. val : -17.16262751714838, Avg. Ret : -17.5498106421166
Iteration [  130  ]
Obj. val : -17.43692658890569, Avg. Ret : -23.100860121463388
Iteration [  131  ]
Obj. val : -17.4378463690499, Avg. Ret : -17.54998163595029
Iteration [  132  ]
Obj. val : -17.576111356365537, Avg. Ret : -16.017084195380285
Iteration [  133  ]
Obj. val : -17.518081198422568, Avg. Ret : -22.93452573547563
Iteration [  134  ]
Obj. val : -16.85800154323739, Avg. Ret : -16.401333298148337
Iteration [  135  ]
Obj. val : -16.858111430648847, Avg. Ret : -17.35188137797796
Iteration [  136  ]
Obj. val : -16.93147738518476, Avg. Ret : -22.66391497596885
Iteration [  137  ]
Obj. val : -17.204405764137885, Avg. Ret : -16.297326534086885
Iteration [  138  ]
Obj. val : -17.250325493554897, Avg. Ret : -17.338362271404318
Iteration [  139  ]
Obj. val : -17.3368429134905, Avg. Ret : -22.790475775621097
Iteration [  140  ]
Obj. val : -17.014450537878467, Avg. Ret : -16.30877089342191
Iteration [  141  ]
Obj. val : -17.368603635499852, Avg. Ret : -17.395870390187394
Iteration [  142  ]
Obj. val : -16.90384025685436, Avg. Ret : -22.650685610455042
Iteration [  143  ]
Obj. val : -17.052518458364705, Avg. Ret : -16.195794470693716
Iteration [  144  ]
Obj. val : -16.932181409884727, Avg. Ret : -17.54794740323012
Iteration [  145  ]
Obj. val : -16.784164807573116, Avg. Ret : -22.732177965666082
Iteration [  146  ]
Obj. val : -16.795746470018724, Avg. Ret : -17.296687479602
Iteration [  147  ]
Obj. val : -16.919139064509082, Avg. Ret : -16.1311117226515
Iteration [  148  ]
Obj. val : -17.240933530526256, Avg. Ret : -22.71557334132206
Iteration [  149  ]
Obj. val : -16.70653474440602, Avg. Ret : -17.431091591513404
Iteration [  150  ]
Obj. val : -16.725925262297086, Avg. Ret : -16.18206309675902
Iteration [  151  ]
Obj. val : -16.524792255803074, Avg. Ret : -22.196099787109375
Iteration [  152  ]
Obj. val : -16.503206113518708, Avg. Ret : -17.48556479824994
Iteration [  153  ]
Obj. val : -17.076571018558212, Avg. Ret : -16.151788037265984
Iteration [  154  ]
Obj. val : -16.587362119502856, Avg. Ret : -22.620156817384782
Iteration [  155  ]
Obj. val : -16.414416352997378, Avg. Ret : -17.351238442391683
Iteration [  156  ]
Obj. val : -16.616736728874404, Avg. Ret : -16.336309937049933
Iteration [  157  ]
Obj. val : -16.258855366906513, Avg. Ret : -20.56084351004771
Iteration [  158  ]
Obj. val : -16.77984590374053, Avg. Ret : -17.59716989754459
Iteration [  159  ]
Obj. val : -16.256328242054916, Avg. Ret : -15.930886197032336
Iteration [  160  ]
Obj. val : -16.462639710463428, Avg. Ret : -22.244852009050547
Iteration [  161  ]
Obj. val : -15.87440792076765, Avg. Ret : -17.040948949995258
Iteration [  162  ]
Obj. val : -16.28789256009523, Avg. Ret : -16.21092146455118
Iteration [  163  ]
Obj. val : -16.74789565427734, Avg. Ret : -20.121550936994023
Iteration [  164  ]
Obj. val : -16.402872422808578, Avg. Ret : -16.93529235966652
Iteration [  165  ]
Obj. val : -16.45542383298118, Avg. Ret : -16.326057064941537
Iteration [  166  ]
Obj. val : -15.633101074452856, Avg. Ret : -22.100805266084425
Iteration [  167  ]
Obj. val : -16.093545804021687, Avg. Ret : -16.20449436319303
Iteration [  168  ]
Obj. val : -16.666242805286437, Avg. Ret : -16.949761399314536
Iteration [  169  ]
Obj. val : -16.0291758596904, Avg. Ret : -22.248222958554223
Iteration [  170  ]
Obj. val : -16.392136096037884, Avg. Ret : -16.878166688849436
Iteration [  171  ]
Obj. val : -16.061314608573962, Avg. Ret : -16.255241989248464
Iteration [  172  ]
Obj. val : -15.646125830764202, Avg. Ret : -22.20947642947924
Iteration [  173  ]
Obj. val : -16.306735173057024, Avg. Ret : -17.040806188208162
Iteration [  174  ]
Obj. val : -16.04192323294422, Avg. Ret : -16.030590141146178
Iteration [  175  ]
Obj. val : -16.07640801915577, Avg. Ret : -22.217813327615936
Iteration [  176  ]
Obj. val : -16.005071064226197, Avg. Ret : -17.343440558934514
Iteration [  177  ]
Obj. val : -16.115178291913836, Avg. Ret : -16.02457476808802
Iteration [  178  ]
Obj. val : -16.065528479915955, Avg. Ret : -22.161738564906628
Iteration [  179  ]
Obj. val : -15.913222220705345, Avg. Ret : -15.787099084449242
Iteration [  180  ]
Obj. val : -16.14300244076292, Avg. Ret : -17.550446536409293
Iteration [  181  ]
Obj. val : -16.275073491122058, Avg. Ret : -22.118305928633777
Iteration [  182  ]
Obj. val : -15.9059457602688, Avg. Ret : -17.296883643024877
Iteration [  183  ]
Obj. val : -15.374565701015381, Avg. Ret : -15.996021748597222
Iteration [  184  ]
Obj. val : -15.960267588744625, Avg. Ret : -21.95351549440992
Iteration [  185  ]
Obj. val : -15.609467995577743, Avg. Ret : -17.233990414074775
Iteration [  186  ]
Obj. val : -15.491869599615391, Avg. Ret : -16.06418754229439
Iteration [  187  ]
Obj. val : -16.07705575877046, Avg. Ret : -22.19038407425117
Iteration [  188  ]
Obj. val : -15.876810235476125, Avg. Ret : -15.92501440891004
Iteration [  189  ]
Obj. val : -16.17320343708157, Avg. Ret : -16.861201580739205
Iteration [  190  ]
Obj. val : -15.957400907332199, Avg. Ret : -21.92390104032187
Iteration [  191  ]
Obj. val : -15.308379601382892, Avg. Ret : -17.158471294882425
Iteration [  192  ]
Obj. val : -15.560917963277303, Avg. Ret : -15.869667349295364
Iteration [  193  ]
Obj. val : -15.91188795268858, Avg. Ret : -21.99104253774401
Iteration [  194  ]
Obj. val : -15.596246171306479, Avg. Ret : -15.800377302111698
Iteration [  195  ]
Obj. val : -15.117303640219731, Avg. Ret : -16.8105210419167
Iteration [  196  ]
Obj. val : -15.446328093806425, Avg. Ret : -21.853431225339943
Iteration [  197  ]
Obj. val : -15.259596000161281, Avg. Ret : -15.972768589266414
Iteration [  198  ]
Obj. val : -15.779295551093565, Avg. Ret : -16.822500741933833
Iteration [  199  ]
Obj. val : -15.034919140776386, Avg. Ret : -21.702581808130113
checkpoint for objective values, iteration: 200. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_3.csv
checkpoint for avg return values, iteration: 200. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_3.csv
Iteration [  200  ]
Obj. val : -15.627600660494368, Avg. Ret : -16.037471652475308
Iteration [  201  ]
Obj. val : -15.330514930875333, Avg. Ret : -16.664624332844152
Iteration [  202  ]
Obj. val : -15.93345799916919, Avg. Ret : -21.583230089962722
Iteration [  203  ]
Obj. val : -15.391329035270752, Avg. Ret : -16.623339822328106
Iteration [  204  ]
Obj. val : -15.110272762198637, Avg. Ret : -16.052454877231707
Iteration [  205  ]
Obj. val : -15.318539958823408, Avg. Ret : -21.61227540718744
Iteration [  206  ]
Obj. val : -15.31289968635099, Avg. Ret : -15.850244193575453
Iteration [  207  ]
Obj. val : -15.301607005199585, Avg. Ret : -16.756964691480032
Iteration [  208  ]
Obj. val : -15.558538280452213, Avg. Ret : -21.757908121313562
Iteration [  209  ]
Obj. val : -14.94378042907134, Avg. Ret : -16.794143752404086
Iteration [  210  ]
Obj. val : -15.563764037209493, Avg. Ret : -15.943639548506065
Iteration [  211  ]
Obj. val : -15.235451049017081, Avg. Ret : -21.658022157571327
Iteration [  212  ]
Obj. val : -15.652161588870976, Avg. Ret : -15.87588770476323
Iteration [  213  ]
Obj. val : -14.97064973061501, Avg. Ret : -16.714160872504344
Iteration [  214  ]
Obj. val : -14.867236086758352, Avg. Ret : -21.44800699610163
Iteration [  215  ]
Obj. val : -15.09400649647727, Avg. Ret : -16.58295981027409
Iteration [  216  ]
Obj. val : -15.601251279384837, Avg. Ret : -15.843062836186881
Iteration [  217  ]
Obj. val : -15.257996475891945, Avg. Ret : -21.298236888177552
Iteration [  218  ]
Obj. val : -15.107737393757873, Avg. Ret : -16.95033502612516
Iteration [  219  ]
Obj. val : -15.246524205540505, Avg. Ret : -15.84827099878055
Iteration [  220  ]
Obj. val : -15.202317337225162, Avg. Ret : -21.402673094857832
Iteration [  221  ]
Obj. val : -15.019806902354535, Avg. Ret : -15.850430536081229
Iteration [  222  ]
Obj. val : -14.848759141004358, Avg. Ret : -16.932497501759112
Iteration [  223  ]
Obj. val : -15.377051221478354, Avg. Ret : -21.244560581835625
Iteration [  224  ]
Obj. val : -15.550424051240261, Avg. Ret : -15.64129229062355
Iteration [  225  ]
Obj. val : -15.341929621306518, Avg. Ret : -16.679772991699732
Iteration [  226  ]
Obj. val : -14.84622560919509, Avg. Ret : -21.39714879310288
Iteration [  227  ]
Obj. val : 56.47835896266794, Avg. Ret : -16.354043320390335
Iteration [  228  ]
Obj. val : -15.05199050810771, Avg. Ret : -15.837343452989929
Iteration [  229  ]
Obj. val : -15.335856590856702, Avg. Ret : -21.386477017673684
Iteration [  230  ]
Obj. val : -15.574819024910008, Avg. Ret : -16.598043916513333
Iteration [  231  ]
Obj. val : -15.555127771276226, Avg. Ret : -15.688800732212322
Iteration [  232  ]
Obj. val : -15.374348069963448, Avg. Ret : -21.515365636960826
Iteration [  233  ]
Obj. val : -15.561606425145238, Avg. Ret : -15.8798943120296
Iteration [  234  ]
Obj. val : -15.448382375556841, Avg. Ret : -16.650407133886052
Iteration [  235  ]
Obj. val : -15.34656747110037, Avg. Ret : -21.185599936165808
Iteration [  236  ]
Obj. val : -15.757560111624022, Avg. Ret : -16.571008122520606
Iteration [  237  ]
Obj. val : -15.569882092138204, Avg. Ret : -15.755399969439097
Iteration [  238  ]
Obj. val : -15.653661119910897, Avg. Ret : -21.2984902858529
Iteration [  239  ]
Obj. val : -15.567918342223525, Avg. Ret : -15.700510116169049
Iteration [  240  ]
Obj. val : -15.548131385289793, Avg. Ret : -16.859183792811297
Iteration [  241  ]
Obj. val : -15.5893127771582, Avg. Ret : -21.356732805456353
Iteration [  242  ]
Obj. val : -15.47272717113294, Avg. Ret : -15.478728240107623
Iteration [  243  ]
Obj. val : -15.999972457962542, Avg. Ret : -16.949390974669576
Iteration [  244  ]
Obj. val : -15.53505547161323, Avg. Ret : -21.05906229316037
Iteration [  245  ]
Obj. val : -16.046975891523676, Avg. Ret : -15.676003391067331
Iteration [  246  ]
Obj. val : -15.858497569594194, Avg. Ret : -17.69514807815736
Iteration [  247  ]
Obj. val : -15.871397544339757, Avg. Ret : -21.1376887060101
Iteration [  248  ]
Obj. val : -16.224252469639826, Avg. Ret : -15.610387206252765
Iteration [  249  ]
Obj. val : -16.058922277250904, Avg. Ret : -17.022243502411044
Iteration [  250  ]
Obj. val : -16.255278650132, Avg. Ret : -20.81139300585458
Iteration [  251  ]
Obj. val : 57.94550694065407, Avg. Ret : -15.442157089671671
Iteration [  252  ]
Obj. val : -16.48947704150192, Avg. Ret : -17.117664704298203
Iteration [  253  ]
Obj. val : -16.515117111922304, Avg. Ret : -20.977967385084852
Iteration [  254  ]
Obj. val : -16.6521357082694, Avg. Ret : -15.46961072784989
Iteration [  255  ]
Obj. val : -16.26556064390906, Avg. Ret : -16.633216261586103
Iteration [  256  ]
Obj. val : -16.25957437033658, Avg. Ret : -20.781711550944543
Iteration [  257  ]
Obj. val : -16.939997405811578, Avg. Ret : -15.259436606786716
Iteration [  258  ]
Obj. val : -16.221427589561497, Avg. Ret : -17.14472995055035
Iteration [  259  ]
Obj. val : -16.667993046428833, Avg. Ret : -21.08937842648257
Iteration [  260  ]
Obj. val : -16.20598916905707, Avg. Ret : -15.191231059282675
Iteration [  261  ]
Obj. val : -17.10008162074317, Avg. Ret : -17.13078020634698
Iteration [  262  ]
Obj. val : -16.835408709780584, Avg. Ret : -18.789074076425287
Iteration [  263  ]
Obj. val : -16.934705294544624, Avg. Ret : -17.08969538933755
Iteration [  264  ]
Obj. val : -16.812033528303783, Avg. Ret : -15.524300414930604
Iteration [  265  ]
Obj. val : -17.28181791527425, Avg. Ret : -20.765596124574802
Iteration [  266  ]
Obj. val : -17.460449886271913, Avg. Ret : -15.1585740835972
Iteration [  267  ]
Obj. val : -17.562915243649716, Avg. Ret : -17.043074382669495
Iteration [  268  ]
Obj. val : -17.2381673706898, Avg. Ret : -20.82142921053876
Iteration [  269  ]
Obj. val : -16.839227821936422, Avg. Ret : -15.454303274966213
Iteration [  270  ]
Obj. val : -17.743410038059803, Avg. Ret : -16.536559947057086
Iteration [  271  ]
Obj. val : 55.31151550776221, Avg. Ret : -20.681009045682735
Iteration [  272  ]
Obj. val : 55.720449326849, Avg. Ret : -16.192775658812565
Iteration [  273  ]
Obj. val : -17.388119709014266, Avg. Ret : -15.54795861959451
Iteration [  274  ]
Obj. val : 54.715855497652846, Avg. Ret : -20.549629172263504
Iteration [  275  ]
Obj. val : -17.599940724891887, Avg. Ret : -15.777843444178007
Iteration [  276  ]
Obj. val : -17.324838556209077, Avg. Ret : -16.143089110420576
Iteration [  277  ]
Obj. val : 53.988880943608926, Avg. Ret : -20.885263180178
Iteration [  278  ]
Obj. val : 52.42378975613947, Avg. Ret : -16.21549861236172
Iteration [  279  ]
Obj. val : -17.318948692110247, Avg. Ret : -15.567821236741029
Iteration [  280  ]
Obj. val : 75.32794478878299, Avg. Ret : -20.536152269808053
Iteration [  281  ]
Obj. val : -17.8453298391375, Avg. Ret : -15.307764820630334
Iteration [  282  ]
Obj. val : 53.36795678251389, Avg. Ret : -16.39276180071057
Iteration [  283  ]
Obj. val : 53.52027132274554, Avg. Ret : -20.544634541586063
Iteration [  284  ]
Obj. val : 53.95254202351817, Avg. Ret : -16.17783437301793
Iteration [  285  ]
Obj. val : 76.98011218069422, Avg. Ret : -15.286963304032847
Iteration [  286  ]
Obj. val : -17.761117988436283, Avg. Ret : -20.500809851187103
Iteration [  287  ]
Obj. val : 66.57340951058045, Avg. Ret : -15.829673843661437
Iteration [  288  ]
Obj. val : -18.07829235436519, Avg. Ret : -16.058818703290004
Iteration [  289  ]
Obj. val : 52.942373308897956, Avg. Ret : -20.350295725493893
Iteration [  290  ]
Obj. val : -17.892656105037624, Avg. Ret : -15.395576987430186
Iteration [  291  ]
Obj. val : -17.834584822103448, Avg. Ret : -16.190869344617788
Iteration [  292  ]
Obj. val : 53.508943107047116, Avg. Ret : -20.642592177725366
Iteration [  293  ]
Obj. val : 73.504213733778, Avg. Ret : -15.82863719226318
Iteration [  294  ]
Obj. val : 63.44779258634964, Avg. Ret : -15.402566568453908
Iteration [  295  ]
Obj. val : 80.19532039617164, Avg. Ret : -20.326009708303115
Iteration [  296  ]
Obj. val : 64.1701006327335, Avg. Ret : -16.19827969947051
Iteration [  297  ]
Obj. val : 53.39490817336718, Avg. Ret : -15.511929929252926
Iteration [  298  ]
Obj. val : 65.56576773717691, Avg. Ret : -20.34642674778907
Iteration [  299  ]
Obj. val : 51.79937061858408, Avg. Ret : -15.261739949312796
checkpoint for objective values, iteration: 300. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_3.csv
checkpoint for avg return values, iteration: 300. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_3.csv
Iteration [  300  ]
Obj. val : 74.12074719156342, Avg. Ret : -16.06050636769557
Iteration [  301  ]
Obj. val : 71.9216729168666, Avg. Ret : -20.3684013174906
Iteration [  302  ]
Obj. val : 72.93609641472833, Avg. Ret : -15.287351933472978
Iteration [  303  ]
Obj. val : -18.13723011645637, Avg. Ret : -16.165315133112458
Iteration [  304  ]
Obj. val : 54.90007970541298, Avg. Ret : -20.29125722848308
Iteration [  305  ]
Obj. val : 63.75312868371045, Avg. Ret : -15.963455862922638
Iteration [  306  ]
Obj. val : 73.58432835465341, Avg. Ret : -15.405415705167211
Iteration [  307  ]
Obj. val : 72.49807733227821, Avg. Ret : -20.19078182837507
Iteration [  308  ]
Obj. val : 68.00893666242648, Avg. Ret : -16.15399839490131
Iteration [  309  ]
Obj. val : -18.113397209262235, Avg. Ret : -15.32746446147968
Iteration [  310  ]
Obj. val : -17.94507427250683, Avg. Ret : -20.112844056257032
Iteration [  311  ]
Obj. val : 65.64619726706185, Avg. Ret : -16.25720475246532
Iteration [  312  ]
Obj. val : 82.05252726830136, Avg. Ret : -15.473817457446703
Iteration [  313  ]
Obj. val : 66.6381187816167, Avg. Ret : -20.388167642550794
Iteration [  314  ]
Obj. val : 77.32838322157691, Avg. Ret : -15.236755239968954
Iteration [  315  ]
Obj. val : 80.93871565714204, Avg. Ret : -16.083947564312695
Iteration [  316  ]
Obj. val : 81.9655838075408, Avg. Ret : -20.09449060667711
Iteration [  317  ]
Obj. val : 63.57284209489995, Avg. Ret : -15.18341451850623
Iteration [  318  ]
Obj. val : 70.88731906390485, Avg. Ret : -15.940479128864835
Iteration [  319  ]
Obj. val : 82.81222814667197, Avg. Ret : -20.020747368790254
Iteration [  320  ]
Obj. val : 80.41711697140627, Avg. Ret : -15.190572155464942
Iteration [  321  ]
Obj. val : 77.45259556607206, Avg. Ret : -15.816420306454754
Iteration [  322  ]
Obj. val : 80.91775951403052, Avg. Ret : -20.053509481750037
Iteration [  323  ]
Obj. val : 77.99078220372624, Avg. Ret : -15.207617820298205
Iteration [  324  ]
Obj. val : 81.99366108031604, Avg. Ret : -15.894755461526218
Iteration [  325  ]
Obj. val : 80.81502735388791, Avg. Ret : -20.06405659011318
Iteration [  326  ]
Obj. val : 66.03214833304304, Avg. Ret : -15.956112995687816
Iteration [  327  ]
Obj. val : 83.91510910426621, Avg. Ret : -15.248198397158921
Iteration [  328  ]
Obj. val : 72.53859447878772, Avg. Ret : -19.79604931659911
Iteration [  329  ]
Obj. val : 83.461772401936, Avg. Ret : -15.965020802735957
Iteration [  330  ]
Obj. val : 82.91047783240704, Avg. Ret : -15.199412788455545
Iteration [  331  ]
Obj. val : 81.7883713950784, Avg. Ret : -19.882818356467716
Iteration [  332  ]
Obj. val : 84.52290768980889, Avg. Ret : -15.187612363144344
Iteration [  333  ]
Obj. val : 82.02799399174246, Avg. Ret : -16.07079561466603
Iteration [  334  ]
Obj. val : 81.97127354733831, Avg. Ret : -20.122778428041592
Iteration [  335  ]
Obj. val : 77.94159773279722, Avg. Ret : -16.17580115916419
Iteration [  336  ]
Obj. val : 83.6464462629749, Avg. Ret : -14.909338321055237
Iteration [  337  ]
Obj. val : 82.89049250075013, Avg. Ret : -19.82930680544781
Iteration [  338  ]
Obj. val : 82.47249143726238, Avg. Ret : -14.879365284334618
Iteration [  339  ]
Obj. val : 79.7347560603874, Avg. Ret : -16.427931929862908
Iteration [  340  ]
Obj. val : 81.19048412155657, Avg. Ret : -19.95102708106795
Iteration [  341  ]
Obj. val : 83.94983374552335, Avg. Ret : -14.96505295373047
Iteration [  342  ]
Obj. val : 84.43669646769357, Avg. Ret : -16.507723820878436
Iteration [  343  ]
Obj. val : 84.41744033257137, Avg. Ret : -19.590692594831292
Iteration [  344  ]
Obj. val : 85.08857886201913, Avg. Ret : -16.472228386730393
Iteration [  345  ]
Obj. val : 83.3929529353951, Avg. Ret : -15.04028314864841
Iteration [  346  ]
Obj. val : 84.42156635487281, Avg. Ret : -19.682882382712926
Iteration [  347  ]
Obj. val : 82.5413785099573, Avg. Ret : -16.525323761158976
Iteration [  348  ]
Obj. val : 83.99706621598821, Avg. Ret : -14.84159641515982
Iteration [  349  ]
Obj. val : 85.02256868521356, Avg. Ret : -19.81085404519881
Iteration [  350  ]
Obj. val : 79.87305942461143, Avg. Ret : -16.73857609725154
Iteration [  351  ]
Obj. val : 83.66777160653179, Avg. Ret : -15.0978379282212
Iteration [  352  ]
Obj. val : 83.11265627353441, Avg. Ret : -19.473314497602104
Iteration [  353  ]
Obj. val : 82.53696941382503, Avg. Ret : -17.337028320089292
Iteration [  354  ]
Obj. val : 82.54051970518498, Avg. Ret : -14.789255157826394
Iteration [  355  ]
Obj. val : 84.07960033614089, Avg. Ret : -19.68374708103978
Iteration [  356  ]
Obj. val : 85.65914736945015, Avg. Ret : -14.860159612019656
Iteration [  357  ]
Obj. val : 82.29090003143443, Avg. Ret : -16.189208281775034
Iteration [  358  ]
Obj. val : 86.85188451144052, Avg. Ret : -19.691803991412048
Iteration [  359  ]
Obj. val : 86.78426753190844, Avg. Ret : -16.9574115499449
Iteration [  360  ]
Obj. val : 78.07402580667112, Avg. Ret : -14.62816340894868
Iteration [  361  ]
Obj. val : 82.83251736598996, Avg. Ret : -19.724154222313224
Iteration [  362  ]
Obj. val : 84.1682906026776, Avg. Ret : -16.31205178886677
Iteration [  363  ]
Obj. val : 84.92468399556611, Avg. Ret : -14.652952922249037
Iteration [  364  ]
Obj. val : 83.69253443721693, Avg. Ret : -19.503105692074424
Iteration [  365  ]
Obj. val : 85.649169967749, Avg. Ret : -15.979345853166818
Iteration [  366  ]
Obj. val : 85.71370121291919, Avg. Ret : -14.719782913043375
Iteration [  367  ]
Obj. val : 86.70974862804745, Avg. Ret : -19.532291897708728
Iteration [  368  ]
Obj. val : 85.72561841219112, Avg. Ret : -16.04663894959849
Iteration [  369  ]
Obj. val : 84.60196494552146, Avg. Ret : -14.939186245540784
Iteration [  370  ]
Obj. val : 86.57741265984434, Avg. Ret : -19.433409444629802
Iteration [  371  ]
Obj. val : 86.39344310437264, Avg. Ret : -15.762644606482425
Iteration [  372  ]
Obj. val : 86.43343492278746, Avg. Ret : -14.822663568130329
Iteration [  373  ]
Obj. val : 84.83048738541873, Avg. Ret : -19.340532593534466
Iteration [  374  ]
Obj. val : 86.56613915881009, Avg. Ret : -15.06514958335651
Iteration [  375  ]
Obj. val : 85.77193311233202, Avg. Ret : -15.492082425531185
Iteration [  376  ]
Obj. val : 86.66963085084232, Avg. Ret : -19.519458175897586
Iteration [  377  ]
Obj. val : 86.0117197519105, Avg. Ret : -15.264496185611037
Iteration [  378  ]
Obj. val : 87.1001408575879, Avg. Ret : -15.067816379638982
Iteration [  379  ]
Obj. val : 85.61075826542987, Avg. Ret : -19.414596362213278
Iteration [  380  ]
Obj. val : 84.02299162642382, Avg. Ret : -14.963565389794589
Iteration [  381  ]
Obj. val : 84.95594760419982, Avg. Ret : -15.398613805008395
Iteration [  382  ]
Obj. val : 86.14990957349025, Avg. Ret : -19.273808190442395
Iteration [  383  ]
Obj. val : 87.10927643830387, Avg. Ret : -15.34416812853291
Iteration [  384  ]
Obj. val : 85.97751937060636, Avg. Ret : -14.89192424795218
Iteration [  385  ]
Obj. val : 86.05488412040465, Avg. Ret : -19.278086649215314
Iteration [  386  ]
Obj. val : 87.03188661997613, Avg. Ret : -15.670385665706023
Iteration [  387  ]
Obj. val : 85.48887168069882, Avg. Ret : -15.056958132236632
Iteration [  388  ]
Obj. val : 85.23509293848777, Avg. Ret : -19.25421762102173
Iteration [  389  ]
Obj. val : 85.72573653424055, Avg. Ret : -14.808246540084449
Iteration [  390  ]
Obj. val : 87.60942411145399, Avg. Ret : -15.936290228922143
Iteration [  391  ]
Obj. val : 85.1239406990917, Avg. Ret : -19.245403175218716
Iteration [  392  ]
Obj. val : 87.12257777167922, Avg. Ret : -16.374508198035322
Iteration [  393  ]
Obj. val : 86.59511402767869, Avg. Ret : -14.631323306087522
Iteration [  394  ]
Obj. val : 87.78899917286492, Avg. Ret : -19.2832948578019
Iteration [  395  ]
Obj. val : 86.30948483161329, Avg. Ret : -14.957327791058486
Iteration [  396  ]
Obj. val : 88.48818950932652, Avg. Ret : -16.513861721433173
Iteration [  397  ]
Obj. val : 86.40971223681892, Avg. Ret : -19.009310512633842
Iteration [  398  ]
Obj. val : 88.39051921054424, Avg. Ret : -17.320677895006764
Iteration [  399  ]
Obj. val : 87.03401918602131, Avg. Ret : -14.379146224963053
checkpoint for objective values, iteration: 400. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_3.csv
checkpoint for avg return values, iteration: 400. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_3.csv
Iteration [  400  ]
Obj. val : 88.13142134594882, Avg. Ret : -19.311484386236568
Iteration [  401  ]
Obj. val : 86.53648484690746, Avg. Ret : -15.997944067316665
Iteration [  402  ]
Obj. val : 87.3137379260801, Avg. Ret : -14.740982490759956
Iteration [  403  ]
Obj. val : 84.33142516551389, Avg. Ret : -19.06767941097624
Iteration [  404  ]
Obj. val : 87.28158103566516, Avg. Ret : -15.925082494321806
Iteration [  405  ]
Obj. val : 87.6537062939027, Avg. Ret : -14.409385367655881
Iteration [  406  ]
Obj. val : 86.12959133708429, Avg. Ret : -19.105096929915838
Iteration [  407  ]
Obj. val : 86.66902305083086, Avg. Ret : -15.231641006388424
Iteration [  408  ]
Obj. val : 87.3181653560828, Avg. Ret : -14.661105006705817
Iteration [  409  ]
Obj. val : 84.42879542075943, Avg. Ret : -19.01730174575191
Iteration [  410  ]
Obj. val : 86.77738650186225, Avg. Ret : -15.274193952526439
Iteration [  411  ]
Obj. val : 85.83795165882114, Avg. Ret : -14.671526392773307
Iteration [  412  ]
Obj. val : 87.27614768572056, Avg. Ret : -19.13323080785242
Iteration [  413  ]
Obj. val : 86.76976749359831, Avg. Ret : -14.560555371320351
Iteration [  414  ]
Obj. val : 87.5972330574017, Avg. Ret : -15.453975574886169
Iteration [  415  ]
Obj. val : 85.5794189785761, Avg. Ret : -19.051711775969608
Iteration [  416  ]
Obj. val : 84.9031344883059, Avg. Ret : -15.948889640639539
Iteration [  417  ]
Obj. val : 85.56309198270652, Avg. Ret : -14.528410336786196
Iteration [  418  ]
Obj. val : 85.10212305355115, Avg. Ret : -18.897150377456096
Iteration [  419  ]
Obj. val : 87.17936412710317, Avg. Ret : -14.393723062080003
Iteration [  420  ]
Obj. val : 85.84110111173095, Avg. Ret : -16.612753876496207
Iteration [  421  ]
Obj. val : 86.42527394044018, Avg. Ret : -18.905414039705693
Iteration [  422  ]
Obj. val : 85.45014826474612, Avg. Ret : -15.787592939771322
Iteration [  423  ]
Obj. val : 86.60206273318948, Avg. Ret : -14.650414222846482
Iteration [  424  ]
Obj. val : 85.40191697547263, Avg. Ret : -18.877329792031222
Iteration [  425  ]
Obj. val : 87.15515269634474, Avg. Ret : -14.612521920589577
Iteration [  426  ]
Obj. val : 85.61533836592649, Avg. Ret : -15.445068618034563
Iteration [  427  ]
Obj. val : 87.38328885035544, Avg. Ret : -18.748625205131034
Iteration [  428  ]
Obj. val : 84.56972015631624, Avg. Ret : -14.541571487166776
Iteration [  429  ]
Obj. val : 85.25195476908218, Avg. Ret : -15.498867617293831
Iteration [  430  ]
Obj. val : 85.11496518473159, Avg. Ret : -18.62852778026458
Iteration [  431  ]
Obj. val : 84.01155361114603, Avg. Ret : -16.119395207773916
Iteration [  432  ]
Obj. val : 85.18208269005416, Avg. Ret : -14.179587819914582
Iteration [  433  ]
Obj. val : 85.00676072538302, Avg. Ret : -18.833945632660306
Iteration [  434  ]
Obj. val : 83.81896066271332, Avg. Ret : -15.665331007362752
Iteration [  435  ]
Obj. val : 84.64379564497997, Avg. Ret : -14.477553239059594
Iteration [  436  ]
Obj. val : 85.06550019954382, Avg. Ret : -18.882442670937582
Iteration [  437  ]
Obj. val : 85.82121642789232, Avg. Ret : -14.487498063911787
Iteration [  438  ]
Obj. val : 85.21385551988047, Avg. Ret : -15.953138754128588
Iteration [  439  ]
Obj. val : 83.21040693552403, Avg. Ret : -18.830975012212647
Iteration [  440  ]
Obj. val : 84.13188362872822, Avg. Ret : -16.652267210084936
Iteration [  441  ]
Obj. val : 85.0994238764087, Avg. Ret : -14.368525018254394
Iteration [  442  ]
Obj. val : 84.31239260123145, Avg. Ret : -18.70712786274914
Iteration [  443  ]
Obj. val : 85.38749771025344, Avg. Ret : -15.652454211590962
Iteration [  444  ]
Obj. val : 85.52646834475574, Avg. Ret : -14.453345880176734
Iteration [  445  ]
Obj. val : 85.65732874992564, Avg. Ret : -18.49065104193352
Iteration [  446  ]
Obj. val : 83.44872382191153, Avg. Ret : -14.130055466680048
Iteration [  447  ]
Obj. val : 85.01764066384246, Avg. Ret : -15.987685773049282
Iteration [  448  ]
Obj. val : 83.31388883067842, Avg. Ret : -18.50658049894439
Iteration [  449  ]
Obj. val : 84.13836431899922, Avg. Ret : -16.140330651960983
Iteration [  450  ]
Obj. val : 85.77960986615487, Avg. Ret : -14.39060862271965
Iteration [  451  ]
Obj. val : 83.68663200220806, Avg. Ret : -18.561617633715944
Iteration [  452  ]
Obj. val : 82.55857163349802, Avg. Ret : -16.437704152773595
Iteration [  453  ]
Obj. val : 84.73984016955062, Avg. Ret : -14.477412274790577
Iteration [  454  ]
Obj. val : 84.96898361971495, Avg. Ret : -18.462374899410925
Iteration [  455  ]
Obj. val : 83.83113732577242, Avg. Ret : -14.193590227424492
Iteration [  456  ]
Obj. val : 85.16227208341688, Avg. Ret : -15.81367360248546
Iteration [  457  ]
Obj. val : 83.02441984931222, Avg. Ret : -18.777279039118998
Iteration [  458  ]
Obj. val : 85.70008423151164, Avg. Ret : -16.13673223867616
Iteration [  459  ]
Obj. val : 84.6637085579318, Avg. Ret : -14.05179675531352
Iteration [  460  ]
Obj. val : 84.01336452936677, Avg. Ret : -18.686051037787436
Iteration [  461  ]
Obj. val : 83.83284833686773, Avg. Ret : -16.849617776495656
Iteration [  462  ]
Obj. val : 85.3586085450737, Avg. Ret : -14.18209221796763
Iteration [  463  ]
Obj. val : 81.44864664415203, Avg. Ret : -18.571292115852977
Iteration [  464  ]
Obj. val : 81.84194219032375, Avg. Ret : -14.161792590242774
Iteration [  465  ]
Obj. val : 87.32837700605248, Avg. Ret : -15.934351811078578
Iteration [  466  ]
Obj. val : 81.27039868622882, Avg. Ret : -18.472840244416048
Iteration [  467  ]
Obj. val : 83.0782539527986, Avg. Ret : -16.545903819875367
Iteration [  468  ]
Obj. val : 83.74016952985284, Avg. Ret : -14.288316823250456
Iteration [  469  ]
Obj. val : 83.37624383455974, Avg. Ret : -18.54812708554632
Iteration [  470  ]
Obj. val : 85.06362595578673, Avg. Ret : -14.519289205702934
Iteration [  471  ]
Obj. val : 83.13877103025904, Avg. Ret : -17.0320084592773
Iteration [  472  ]
Obj. val : 81.33592994492064, Avg. Ret : -18.356456623892488
Iteration [  473  ]
Obj. val : 84.20072498224924, Avg. Ret : -14.249474068021737
Iteration [  474  ]
Obj. val : 82.30279255153403, Avg. Ret : -16.554942404793206
Iteration [  475  ]
Obj. val : 85.59102162156873, Avg. Ret : -18.430941162602128
Iteration [  476  ]
Obj. val : 85.28758239839954, Avg. Ret : -15.917997704112265
Iteration [  477  ]
Obj. val : 82.63214628623534, Avg. Ret : -14.13313358543869
Iteration [  478  ]
Obj. val : 84.00139892471164, Avg. Ret : -18.407216130861443
Iteration [  479  ]
Obj. val : 83.6858616959865, Avg. Ret : -16.159333035479438
Iteration [  480  ]
Obj. val : 83.56329596371546, Avg. Ret : -14.19626022558532
Iteration [  481  ]
Obj. val : 82.25690086411224, Avg. Ret : -18.261397335866526
Iteration [  482  ]
Obj. val : 84.60496171097591, Avg. Ret : -16.804635032647997
Iteration [  483  ]
Obj. val : 84.98029936868915, Avg. Ret : -14.295115975700487
Iteration [  484  ]
Obj. val : 84.46743562369228, Avg. Ret : -18.393015892960666
Iteration [  485  ]
Obj. val : 84.40758323554202, Avg. Ret : -13.929135926124886
Iteration [  486  ]
Obj. val : 81.91951316199754, Avg. Ret : -15.875024257142327
Iteration [  487  ]
Obj. val : 84.27344704451389, Avg. Ret : -18.01987811890197
Iteration [  488  ]
Obj. val : 82.52587769358162, Avg. Ret : -16.37357519924326
Iteration [  489  ]
Obj. val : 85.26420026548095, Avg. Ret : -14.20369487435052
Iteration [  490  ]
Obj. val : 82.98640698175181, Avg. Ret : -18.169295825943305
Iteration [  491  ]
Obj. val : 84.76010784577514, Avg. Ret : -14.176777603900844
Iteration [  492  ]
Obj. val : 81.40137918709358, Avg. Ret : -15.348509541293438
Iteration [  493  ]
Obj. val : 82.5916374987671, Avg. Ret : -18.096910080712416
Iteration [  494  ]
Obj. val : 85.26085633320822, Avg. Ret : -14.043358165018965
Iteration [  495  ]
Obj. val : 84.50287416016977, Avg. Ret : -16.124753903711003
Iteration [  496  ]
Obj. val : 84.74586946879963, Avg. Ret : -17.989254728508875
Iteration [  497  ]
Obj. val : 81.66885282006416, Avg. Ret : -15.34725671427806
Iteration [  498  ]
Obj. val : 82.40252272393441, Avg. Ret : -14.010523395233935
Iteration [  499  ]
Obj. val : 82.47223515128384, Avg. Ret : -18.2270886063415
checkpoint for objective values, iteration: 500. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_3.csv
checkpoint for avg return values, iteration: 500. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_3.csv
batch = 4
inside iterator
Iteration [  0  ]
Obj. val : -23.27845737021199, Avg. Ret : -22.56310685610284
Iteration [  1  ]
Obj. val : -23.41229395782704, Avg. Ret : -22.706593912078596
Iteration [  2  ]
Obj. val : -22.741465106636547, Avg. Ret : -22.747211221334695
Iteration [  3  ]
Obj. val : -23.32623217309799, Avg. Ret : -22.667324980177373
Iteration [  4  ]
Obj. val : -22.821740955133066, Avg. Ret : -22.672953401691256
Iteration [  5  ]
Obj. val : 50.81866973373372, Avg. Ret : -22.860085878302698
Iteration [  6  ]
Obj. val : -22.95024491398761, Avg. Ret : -22.60279452775355
Iteration [  7  ]
Obj. val : -22.944771336903454, Avg. Ret : -22.77553608932194
Iteration [  8  ]
Obj. val : -22.594370614776278, Avg. Ret : -22.18504296321638
Iteration [  9  ]
Obj. val : -22.638349597730162, Avg. Ret : -22.657883704372253
Iteration [  10  ]
Obj. val : -21.915671501001274, Avg. Ret : -22.843253766780755
Iteration [  11  ]
Obj. val : -22.25485989523605, Avg. Ret : -22.888496787421523
Iteration [  12  ]
Obj. val : -22.250328314471272, Avg. Ret : -22.27378135759943
Iteration [  13  ]
Obj. val : -22.42186237899952, Avg. Ret : -22.648255978426327
Iteration [  14  ]
Obj. val : -22.477180718120643, Avg. Ret : -22.788895100906085
Iteration [  15  ]
Obj. val : -22.67869332252302, Avg. Ret : -22.63864289683183
Iteration [  16  ]
Obj. val : -21.78579114234342, Avg. Ret : -22.82468617315692
Iteration [  17  ]
Obj. val : -22.0356296182038, Avg. Ret : -22.67249766302877
Iteration [  18  ]
Obj. val : -22.560897983611305, Avg. Ret : -22.470295476123393
Iteration [  19  ]
Obj. val : -22.153178853320487, Avg. Ret : -22.45908354132368
Iteration [  20  ]
Obj. val : -21.736369163595867, Avg. Ret : -38.36804964418553
Iteration [  21  ]
Obj. val : -22.261293042442343, Avg. Ret : -16.529406482912172
Iteration [  22  ]
Obj. val : -21.9287434932812, Avg. Ret : -42.54796095950227
Iteration [  23  ]
Obj. val : -21.637743221021445, Avg. Ret : -27.31047996181149
Iteration [  24  ]
Obj. val : -21.8821014783756, Avg. Ret : -11.20615091595257
Iteration [  25  ]
Obj. val : -21.761100207748722, Avg. Ret : -32.09888992967401
Iteration [  26  ]
Obj. val : -21.62947367699374, Avg. Ret : -13.411100371045302
Iteration [  27  ]
Obj. val : -21.86308261013378, Avg. Ret : -30.472364205797035
Iteration [  28  ]
Obj. val : -21.594443522110538, Avg. Ret : -30.960192103069193
Iteration [  29  ]
Obj. val : -21.460256847014058, Avg. Ret : -22.22001143603452
Iteration [  30  ]
Obj. val : -21.499280280237418, Avg. Ret : -15.874533683260616
Iteration [  31  ]
Obj. val : -21.85878519817653, Avg. Ret : -27.875056985489767
Iteration [  32  ]
Obj. val : -21.0847346112182, Avg. Ret : -22.021139274910233
Iteration [  33  ]
Obj. val : -21.14152781726932, Avg. Ret : -27.703850673369935
Iteration [  34  ]
Obj. val : -21.33211052752379, Avg. Ret : -17.611551074150373
Iteration [  35  ]
Obj. val : -21.16532723705545, Avg. Ret : -27.10254210786523
Iteration [  36  ]
Obj. val : -21.008705072265908, Avg. Ret : -26.099178719529565
Iteration [  37  ]
Obj. val : -20.915334721886584, Avg. Ret : -21.589386884857667
Iteration [  38  ]
Obj. val : -21.396778087284954, Avg. Ret : -21.617090362862115
Iteration [  39  ]
Obj. val : -20.607249140963376, Avg. Ret : -25.56280220303564
Iteration [  40  ]
Obj. val : -20.917193038456162, Avg. Ret : -24.76126773450416
Iteration [  41  ]
Obj. val : -20.99071910516259, Avg. Ret : -22.572319594224368
Iteration [  42  ]
Obj. val : -21.08681042669879, Avg. Ret : -21.978537788872163
Iteration [  43  ]
Obj. val : -21.077948335108598, Avg. Ret : -24.984649032572573
Iteration [  44  ]
Obj. val : -20.629969433781522, Avg. Ret : -22.338482541993766
Iteration [  45  ]
Obj. val : -20.362909240190465, Avg. Ret : -22.471289226068876
Iteration [  46  ]
Obj. val : -20.519754885371444, Avg. Ret : -24.61424502937552
Iteration [  47  ]
Obj. val : -20.573124286554677, Avg. Ret : -22.410719038035225
Iteration [  48  ]
Obj. val : -20.287366917723574, Avg. Ret : -22.567715772158085
Iteration [  49  ]
Obj. val : -20.42706141509182, Avg. Ret : -24.759265904718067
Iteration [  50  ]
Obj. val : -20.404166619988146, Avg. Ret : -22.43007143616494
Iteration [  51  ]
Obj. val : -20.13966763756928, Avg. Ret : -22.136263122407996
Iteration [  52  ]
Obj. val : -20.43714364783083, Avg. Ret : -24.49593918625936
Iteration [  53  ]
Obj. val : -20.36335286215593, Avg. Ret : -22.290042936443296
Iteration [  54  ]
Obj. val : -20.436911667294744, Avg. Ret : -22.11112611757361
Iteration [  55  ]
Obj. val : -20.21868555648534, Avg. Ret : -22.383242828857657
Iteration [  56  ]
Obj. val : -20.420436744318867, Avg. Ret : -21.780722780701176
Iteration [  57  ]
Obj. val : -20.270714698361555, Avg. Ret : -22.432829332560765
Iteration [  58  ]
Obj. val : -19.587598025652806, Avg. Ret : -24.580920239518477
Iteration [  59  ]
Obj. val : -19.682926694016658, Avg. Ret : -22.035340629445002
Iteration [  60  ]
Obj. val : -19.92237984767282, Avg. Ret : -22.316849136914417
Iteration [  61  ]
Obj. val : -19.185880659248628, Avg. Ret : -24.343475739619926
Iteration [  62  ]
Obj. val : -20.012774766226983, Avg. Ret : -21.781724905884683
Iteration [  63  ]
Obj. val : -19.499505325608396, Avg. Ret : -22.309071681611858
Iteration [  64  ]
Obj. val : -20.011948440645718, Avg. Ret : -24.280346782368724
Iteration [  65  ]
Obj. val : -19.769209807738076, Avg. Ret : -21.748660291591985
Iteration [  66  ]
Obj. val : -19.197813483010044, Avg. Ret : -22.005059984087385
Iteration [  67  ]
Obj. val : -19.342430025752154, Avg. Ret : -24.25182999396546
Iteration [  68  ]
Obj. val : -19.439603762774002, Avg. Ret : -21.736871644893544
Iteration [  69  ]
Obj. val : -19.065653886039726, Avg. Ret : -21.770097523553414
Iteration [  70  ]
Obj. val : -19.68512159808656, Avg. Ret : -24.08328506610405
Iteration [  71  ]
Obj. val : -19.69414163051038, Avg. Ret : -21.886666751253934
Iteration [  72  ]
Obj. val : -19.197305854584066, Avg. Ret : -21.79302170960531
Iteration [  73  ]
Obj. val : -19.853938126503593, Avg. Ret : -24.13423912467164
Iteration [  74  ]
Obj. val : -18.568412423052518, Avg. Ret : -21.820737968820175
Iteration [  75  ]
Obj. val : -18.949889144202835, Avg. Ret : -21.912794403762895
Iteration [  76  ]
Obj. val : -19.016030827349446, Avg. Ret : -24.069132698845692
Iteration [  77  ]
Obj. val : -19.35749772814517, Avg. Ret : -21.532688788442805
Iteration [  78  ]
Obj. val : -19.153095379535994, Avg. Ret : -21.87072883168573
Iteration [  79  ]
Obj. val : -18.950738269291033, Avg. Ret : -23.94184912109061
Iteration [  80  ]
Obj. val : -18.85047878614291, Avg. Ret : -21.7939710566848
Iteration [  81  ]
Obj. val : -18.850962955284356, Avg. Ret : -21.57958533299315
Iteration [  82  ]
Obj. val : -18.976080658277862, Avg. Ret : -24.07351516184233
Iteration [  83  ]
Obj. val : -18.668209806304496, Avg. Ret : -21.73894475390992
Iteration [  84  ]
Obj. val : -18.9138785716414, Avg. Ret : -21.63266530944634
Iteration [  85  ]
Obj. val : -18.97994967922923, Avg. Ret : -23.806880514631207
Iteration [  86  ]
Obj. val : -18.284179085167487, Avg. Ret : -21.29113313743035
Iteration [  87  ]
Obj. val : -18.91131244833568, Avg. Ret : -21.536796423140274
Iteration [  88  ]
Obj. val : -18.711031583678945, Avg. Ret : -23.84254161599636
Iteration [  89  ]
Obj. val : -18.695541541686396, Avg. Ret : -21.88396374368177
Iteration [  90  ]
Obj. val : -18.097349658804653, Avg. Ret : -21.53198371962225
Iteration [  91  ]
Obj. val : -18.644402238139673, Avg. Ret : -23.731612270836845
Iteration [  92  ]
Obj. val : -18.045184453849995, Avg. Ret : -21.411961055677985
Iteration [  93  ]
Obj. val : -18.295791150418854, Avg. Ret : -21.45278108639644
Iteration [  94  ]
Obj. val : -18.320155033538732, Avg. Ret : -23.911697401459442
Iteration [  95  ]
Obj. val : -17.893373181380106, Avg. Ret : -21.577263610835086
Iteration [  96  ]
Obj. val : -17.84308429120725, Avg. Ret : -21.14015250900187
Iteration [  97  ]
Obj. val : -18.27705631811826, Avg. Ret : -23.690232836653227
Iteration [  98  ]
Obj. val : -17.646788129960086, Avg. Ret : -21.26374873924077
Iteration [  99  ]
Obj. val : -17.798556150266098, Avg. Ret : -20.866245024487686
checkpoint for objective values, iteration: 100. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_4.csv
checkpoint for avg return values, iteration: 100. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_4.csv
Iteration [  100  ]
Obj. val : -18.141564179366416, Avg. Ret : -23.506507608895753
Iteration [  101  ]
Obj. val : -17.73480658062295, Avg. Ret : -20.81375691509877
Iteration [  102  ]
Obj. val : -17.81430857625837, Avg. Ret : -21.37361458827356
Iteration [  103  ]
Obj. val : -17.54530044287601, Avg. Ret : -23.507565252971045
Iteration [  104  ]
Obj. val : -17.89553599528376, Avg. Ret : -20.589526615594558
Iteration [  105  ]
Obj. val : -17.73347220671366, Avg. Ret : -21.51517549340676
Iteration [  106  ]
Obj. val : -17.72512852109467, Avg. Ret : -23.295125423397405
Iteration [  107  ]
Obj. val : -17.29157081181892, Avg. Ret : -21.12335511647403
Iteration [  108  ]
Obj. val : -17.770831620471917, Avg. Ret : -20.940470995478286
Iteration [  109  ]
Obj. val : -17.72416704675067, Avg. Ret : -23.251287240564704
Iteration [  110  ]
Obj. val : -17.776051245844684, Avg. Ret : -20.82996243429225
Iteration [  111  ]
Obj. val : -17.611368254628566, Avg. Ret : -21.072493347308146
Iteration [  112  ]
Obj. val : -17.395138229121528, Avg. Ret : -23.365253589021904
Iteration [  113  ]
Obj. val : -17.328505068131232, Avg. Ret : -21.015259134788707
Iteration [  114  ]
Obj. val : -17.214731846947902, Avg. Ret : -21.20316063034322
Iteration [  115  ]
Obj. val : -17.24077207545578, Avg. Ret : -23.397903121822868
Iteration [  116  ]
Obj. val : -16.581578377677253, Avg. Ret : -20.680803938994515
Iteration [  117  ]
Obj. val : -17.314771669679516, Avg. Ret : -20.868865829618418
Iteration [  118  ]
Obj. val : -16.979972796499787, Avg. Ret : -23.199185869589563
Iteration [  119  ]
Obj. val : -16.720658579674648, Avg. Ret : -20.34289064377434
Iteration [  120  ]
Obj. val : -16.687269298941423, Avg. Ret : -20.743066875730833
Iteration [  121  ]
Obj. val : -16.999936041690578, Avg. Ret : -23.424304815998394
Iteration [  122  ]
Obj. val : -17.136773949582377, Avg. Ret : -20.764529830393506
Iteration [  123  ]
Obj. val : -16.498090912949046, Avg. Ret : -20.732432227625164
Iteration [  124  ]
Obj. val : -16.622505196323864, Avg. Ret : -22.936320285813967
Iteration [  125  ]
Obj. val : -17.038167466806662, Avg. Ret : -20.72384995735044
Iteration [  126  ]
Obj. val : -16.658073475404336, Avg. Ret : -20.677452699461597
Iteration [  127  ]
Obj. val : -16.35939427168399, Avg. Ret : -23.081966393192726
Iteration [  128  ]
Obj. val : -16.722667402886895, Avg. Ret : -20.725460939021904
Iteration [  129  ]
Obj. val : -16.120187735636655, Avg. Ret : -20.756025747291773
Iteration [  130  ]
Obj. val : -16.136970382415882, Avg. Ret : -23.14076970309712
Iteration [  131  ]
Obj. val : -16.160736447161042, Avg. Ret : -20.427758363327438
Iteration [  132  ]
Obj. val : -16.1666108280769, Avg. Ret : -20.568503941633985
Iteration [  133  ]
Obj. val : -16.3625229078336, Avg. Ret : -23.119684860807286
Iteration [  134  ]
Obj. val : -15.979805438947313, Avg. Ret : -20.747395788166674
Iteration [  135  ]
Obj. val : -15.975866411785587, Avg. Ret : -20.366341718540852
Iteration [  136  ]
Obj. val : -15.804188911155522, Avg. Ret : -22.94504009464713
Iteration [  137  ]
Obj. val : -16.419557390896152, Avg. Ret : -21.344433885612826
Iteration [  138  ]
Obj. val : -15.999602944272915, Avg. Ret : -19.672812998715813
Iteration [  139  ]
Obj. val : -15.981162588122602, Avg. Ret : -22.83973710886458
Iteration [  140  ]
Obj. val : -15.843181042637129, Avg. Ret : -19.74380108445216
Iteration [  141  ]
Obj. val : -16.17941206777132, Avg. Ret : -20.67381585907002
Iteration [  142  ]
Obj. val : -15.640996599612276, Avg. Ret : -22.814162299799428
Iteration [  143  ]
Obj. val : -15.833758683325579, Avg. Ret : -20.341813414829392
Iteration [  144  ]
Obj. val : -15.761975369851525, Avg. Ret : -20.155664784747945
Iteration [  145  ]
Obj. val : -15.475771431706374, Avg. Ret : -23.01635038628152
Iteration [  146  ]
Obj. val : -15.600793688468736, Avg. Ret : -19.494674960998697
Iteration [  147  ]
Obj. val : -15.661328994887267, Avg. Ret : -20.753784904146414
Iteration [  148  ]
Obj. val : -15.697330677958439, Avg. Ret : -22.70997812611056
Iteration [  149  ]
Obj. val : -15.359682378122981, Avg. Ret : -19.773589088887626
Iteration [  150  ]
Obj. val : -15.29311043742938, Avg. Ret : -20.371974793657905
Iteration [  151  ]
Obj. val : -15.691149443691582, Avg. Ret : -22.746420100565725
Iteration [  152  ]
Obj. val : -14.982952561040285, Avg. Ret : -19.92164858310569
Iteration [  153  ]
Obj. val : -14.035137196481624, Avg. Ret : -19.97538723814775
Iteration [  154  ]
Obj. val : -14.858788458753766, Avg. Ret : -22.61516003961781
Iteration [  155  ]
Obj. val : -14.823148277607208, Avg. Ret : -19.229938539556034
Iteration [  156  ]
Obj. val : -14.99927024621133, Avg. Ret : -20.472029140864585
Iteration [  157  ]
Obj. val : -14.895948683006663, Avg. Ret : -22.349166111761534
Iteration [  158  ]
Obj. val : -14.825449287614529, Avg. Ret : -19.747065173844643
Iteration [  159  ]
Obj. val : -14.49037880827208, Avg. Ret : -19.658913616241147
Iteration [  160  ]
Obj. val : -14.934566454436515, Avg. Ret : -22.485607025072724
Iteration [  161  ]
Obj. val : -14.835590192408736, Avg. Ret : -20.099761843595807
Iteration [  162  ]
Obj. val : -14.550188399235731, Avg. Ret : -19.043413096167477
Iteration [  163  ]
Obj. val : -14.231318493685981, Avg. Ret : -22.529548279811788
Iteration [  164  ]
Obj. val : -14.741109114684857, Avg. Ret : -19.56132364807279
Iteration [  165  ]
Obj. val : -14.146243603550003, Avg. Ret : -19.48306217819504
Iteration [  166  ]
Obj. val : -14.212736940394732, Avg. Ret : -22.66093712756673
Iteration [  167  ]
Obj. val : -14.724173516508728, Avg. Ret : -19.441471115757448
Iteration [  168  ]
Obj. val : -14.202449343871894, Avg. Ret : -19.278523055969625
Iteration [  169  ]
Obj. val : -14.293345325137459, Avg. Ret : -22.31627440822844
Iteration [  170  ]
Obj. val : -14.311608722278246, Avg. Ret : -19.24780953982553
Iteration [  171  ]
Obj. val : -14.282214707050167, Avg. Ret : -19.350935647814776
Iteration [  172  ]
Obj. val : -13.751707352860196, Avg. Ret : -22.466933919708723
Iteration [  173  ]
Obj. val : -13.928089719600099, Avg. Ret : -18.671730811223895
Iteration [  174  ]
Obj. val : -13.883397651489446, Avg. Ret : -19.975948476156756
Iteration [  175  ]
Obj. val : -14.231804184747459, Avg. Ret : -22.28751293679176
Iteration [  176  ]
Obj. val : -13.996708507497528, Avg. Ret : -19.672353737091722
Iteration [  177  ]
Obj. val : -14.047115296013912, Avg. Ret : -18.404882504336495
Iteration [  178  ]
Obj. val : -13.820210282639351, Avg. Ret : -22.172113378687087
Iteration [  179  ]
Obj. val : -13.68164802132747, Avg. Ret : -18.2965284237899
Iteration [  180  ]
Obj. val : -13.9019675880163, Avg. Ret : -19.766002442062224
Iteration [  181  ]
Obj. val : -13.152051167772361, Avg. Ret : -22.199654050078482
Iteration [  182  ]
Obj. val : -13.739130663709556, Avg. Ret : -19.106786655435457
Iteration [  183  ]
Obj. val : -13.839685472695468, Avg. Ret : -18.960989968847187
Iteration [  184  ]
Obj. val : -13.284599599868534, Avg. Ret : -21.971472547817918
Iteration [  185  ]
Obj. val : -13.832940108632103, Avg. Ret : -18.57313048971976
Iteration [  186  ]
Obj. val : -12.943210607008774, Avg. Ret : -19.169491421959894
Iteration [  187  ]
Obj. val : -13.31557877791164, Avg. Ret : -22.135114036882925
Iteration [  188  ]
Obj. val : -13.31566256549509, Avg. Ret : -19.140382064601887
Iteration [  189  ]
Obj. val : -13.372347724992322, Avg. Ret : -18.813666478983876
Iteration [  190  ]
Obj. val : -12.559564376757423, Avg. Ret : -22.019617006551936
Iteration [  191  ]
Obj. val : -12.99036458666113, Avg. Ret : -19.490096182090824
Iteration [  192  ]
Obj. val : -12.658241222300498, Avg. Ret : -18.132619974411575
Iteration [  193  ]
Obj. val : -12.78282086090009, Avg. Ret : -21.828625100395133
Iteration [  194  ]
Obj. val : -13.112755803278251, Avg. Ret : -18.426396793625894
Iteration [  195  ]
Obj. val : -12.893312043806233, Avg. Ret : -18.531233338117353
Iteration [  196  ]
Obj. val : -12.75158933339716, Avg. Ret : -22.09928976770143
Iteration [  197  ]
Obj. val : -12.84246701300194, Avg. Ret : -18.19723973191427
Iteration [  198  ]
Obj. val : -12.388452354977902, Avg. Ret : -18.66387804583043
Iteration [  199  ]
Obj. val : -12.664148166413307, Avg. Ret : -21.80973461065318
checkpoint for objective values, iteration: 200. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_4.csv
checkpoint for avg return values, iteration: 200. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_4.csv
Iteration [  200  ]
Obj. val : -12.061186839431034, Avg. Ret : -18.54475237806464
Iteration [  201  ]
Obj. val : -12.476471804787666, Avg. Ret : -18.767918469623165
Iteration [  202  ]
Obj. val : -12.177776710423016, Avg. Ret : -21.7858722716359
Iteration [  203  ]
Obj. val : -12.183424974627124, Avg. Ret : -18.71617451319582
Iteration [  204  ]
Obj. val : -12.322400036280849, Avg. Ret : -17.862758530470227
Iteration [  205  ]
Obj. val : -12.07548686165754, Avg. Ret : -21.74547257521764
Iteration [  206  ]
Obj. val : -12.624670493990074, Avg. Ret : -18.19247049218412
Iteration [  207  ]
Obj. val : -12.285925245360936, Avg. Ret : -18.53197659303121
Iteration [  208  ]
Obj. val : -12.21667103581847, Avg. Ret : -21.632563455913168
Iteration [  209  ]
Obj. val : -11.900419019874185, Avg. Ret : -17.77870659148479
Iteration [  210  ]
Obj. val : -12.226642401411583, Avg. Ret : -18.667993885507336
Iteration [  211  ]
Obj. val : -11.913723917514256, Avg. Ret : -21.8160643843863
Iteration [  212  ]
Obj. val : -11.899596028666808, Avg. Ret : -17.94718895471841
Iteration [  213  ]
Obj. val : -12.040620330764087, Avg. Ret : -18.100282775441084
Iteration [  214  ]
Obj. val : -11.939299831323568, Avg. Ret : -21.645043473056447
Iteration [  215  ]
Obj. val : -11.536219589503116, Avg. Ret : -17.912387696364952
Iteration [  216  ]
Obj. val : -11.61065260849464, Avg. Ret : -17.933456910336567
Iteration [  217  ]
Obj. val : -11.74953087953367, Avg. Ret : -21.416523300794665
Iteration [  218  ]
Obj. val : -11.912780298875884, Avg. Ret : -17.328815030488883
Iteration [  219  ]
Obj. val : -11.476037662921575, Avg. Ret : -18.547184146590276
Iteration [  220  ]
Obj. val : -11.7662019547033, Avg. Ret : -21.56887962698922
Iteration [  221  ]
Obj. val : -11.68406267548474, Avg. Ret : -18.45951981365295
Iteration [  222  ]
Obj. val : -11.521420512454071, Avg. Ret : -17.186023326060145
Iteration [  223  ]
Obj. val : -11.410188249649941, Avg. Ret : -21.65372785339844
Iteration [  224  ]
Obj. val : -11.310740156463117, Avg. Ret : -17.723724998204382
Iteration [  225  ]
Obj. val : -10.96864477176006, Avg. Ret : -17.987338502828777
Iteration [  226  ]
Obj. val : -11.160391624949579, Avg. Ret : -21.232148378116484
Iteration [  227  ]
Obj. val : -11.503757268787393, Avg. Ret : -17.44793438414065
Iteration [  228  ]
Obj. val : -11.010847278584432, Avg. Ret : -17.745360238101362
Iteration [  229  ]
Obj. val : -11.331624233473267, Avg. Ret : -21.33756007253708
Iteration [  230  ]
Obj. val : -11.1645151143061, Avg. Ret : -17.64080463310437
Iteration [  231  ]
Obj. val : -10.75506177645306, Avg. Ret : -17.57309085934843
Iteration [  232  ]
Obj. val : -10.95428058637848, Avg. Ret : -21.383715048185028
Iteration [  233  ]
Obj. val : -10.924481223653968, Avg. Ret : -17.293962752844976
Iteration [  234  ]
Obj. val : -10.631715267260638, Avg. Ret : -17.29482359014464
Iteration [  235  ]
Obj. val : -11.194722331645748, Avg. Ret : -21.18092216797574
Iteration [  236  ]
Obj. val : -10.994263565775842, Avg. Ret : -17.002506864228927
Iteration [  237  ]
Obj. val : -10.901239883816285, Avg. Ret : -17.74617465041462
Iteration [  238  ]
Obj. val : -10.633541948487824, Avg. Ret : -21.195312955777528
Iteration [  239  ]
Obj. val : -10.391182822009018, Avg. Ret : -16.812257825581444
Iteration [  240  ]
Obj. val : -10.533029790748138, Avg. Ret : -17.813423724142865
Iteration [  241  ]
Obj. val : -10.698260151894548, Avg. Ret : -20.96535227926964
Iteration [  242  ]
Obj. val : -10.386008124240911, Avg. Ret : -17.028644616027886
Iteration [  243  ]
Obj. val : -10.28533722480518, Avg. Ret : -17.161346349995107
Iteration [  244  ]
Obj. val : -10.052178177434731, Avg. Ret : -21.088217726537092
Iteration [  245  ]
Obj. val : -10.610066942226076, Avg. Ret : -17.14394915889863
Iteration [  246  ]
Obj. val : -10.326392234337407, Avg. Ret : -17.13089619390057
Iteration [  247  ]
Obj. val : -10.019690668295803, Avg. Ret : -20.958287947101987
Iteration [  248  ]
Obj. val : -10.18717884849871, Avg. Ret : -17.705341792119622
Iteration [  249  ]
Obj. val : -10.140561668106498, Avg. Ret : -16.6203542856651
Iteration [  250  ]
Obj. val : -9.906272927030967, Avg. Ret : -21.03202736374648
Iteration [  251  ]
Obj. val : -10.156887317054304, Avg. Ret : -17.543710101316023
Iteration [  252  ]
Obj. val : -10.004838513415072, Avg. Ret : -16.716359428768822
Iteration [  253  ]
Obj. val : -9.952395825153388, Avg. Ret : -21.008419240210156
Iteration [  254  ]
Obj. val : -9.560824086937304, Avg. Ret : -17.127342912134534
Iteration [  255  ]
Obj. val : -9.813772877478701, Avg. Ret : -16.798740458980006
Iteration [  256  ]
Obj. val : -9.915751915108649, Avg. Ret : -20.982195212509247
Iteration [  257  ]
Obj. val : -9.758755096960645, Avg. Ret : -16.29684118716157
Iteration [  258  ]
Obj. val : -9.886906120865385, Avg. Ret : -17.21969160191984
Iteration [  259  ]
Obj. val : -9.444288500023724, Avg. Ret : -20.977525304366427
Iteration [  260  ]
Obj. val : -9.697575396154491, Avg. Ret : -16.51743556954692
Iteration [  261  ]
Obj. val : -9.631280496900358, Avg. Ret : -16.91718698149382
Iteration [  262  ]
Obj. val : -9.374475480723854, Avg. Ret : -20.751404425666014
Iteration [  263  ]
Obj. val : -9.541589714239436, Avg. Ret : -16.377853554958893
Iteration [  264  ]
Obj. val : -9.630752807475478, Avg. Ret : -16.654305282260033
Iteration [  265  ]
Obj. val : -9.609651072220109, Avg. Ret : -20.703331765377303
Iteration [  266  ]
Obj. val : -9.567032262917515, Avg. Ret : -16.718524085759764
Iteration [  267  ]
Obj. val : -8.912644545074611, Avg. Ret : -16.610076724910222
Iteration [  268  ]
Obj. val : -9.17664409815092, Avg. Ret : -20.858976128122436
Iteration [  269  ]
Obj. val : -9.353789589496623, Avg. Ret : -17.090154976687273
Iteration [  270  ]
Obj. val : -9.468064219975997, Avg. Ret : -16.137854054110946
Iteration [  271  ]
Obj. val : -8.988423790481734, Avg. Ret : -20.7693934704546
Iteration [  272  ]
Obj. val : -9.308004755238795, Avg. Ret : -16.428818699432078
Iteration [  273  ]
Obj. val : -9.033380101795833, Avg. Ret : -16.314609956664878
Iteration [  274  ]
Obj. val : -8.96978055299435, Avg. Ret : -20.60852756643836
Iteration [  275  ]
Obj. val : -9.364210926116797, Avg. Ret : -16.33741724983409
Iteration [  276  ]
Obj. val : -8.7348164226931, Avg. Ret : -16.09735040198772
Iteration [  277  ]
Obj. val : -9.08992370131887, Avg. Ret : -20.476146701777107
Iteration [  278  ]
Obj. val : -8.959926686105616, Avg. Ret : -16.14163774007664
Iteration [  279  ]
Obj. val : -8.800993405471985, Avg. Ret : -16.07846239438896
Iteration [  280  ]
Obj. val : -8.404562308146001, Avg. Ret : -20.509739820704144
Iteration [  281  ]
Obj. val : -8.638958467838398, Avg. Ret : -16.224061077418824
Iteration [  282  ]
Obj. val : -8.900634838116023, Avg. Ret : -16.030924994107018
Iteration [  283  ]
Obj. val : -8.472295313266246, Avg. Ret : -20.358479595248703
Iteration [  284  ]
Obj. val : -8.722294840190663, Avg. Ret : -16.15334721153016
Iteration [  285  ]
Obj. val : -8.782478258053345, Avg. Ret : -16.27689109944461
Iteration [  286  ]
Obj. val : -8.491291928174848, Avg. Ret : -20.46549575762944
Iteration [  287  ]
Obj. val : -8.664570307845503, Avg. Ret : -15.585885207505873
Iteration [  288  ]
Obj. val : -8.636419227764558, Avg. Ret : -16.380929131278855
Iteration [  289  ]
Obj. val : -8.619465662873921, Avg. Ret : -20.286209335375318
Iteration [  290  ]
Obj. val : -8.443435979960512, Avg. Ret : -15.362657791331054
Iteration [  291  ]
Obj. val : -8.484153460212328, Avg. Ret : -16.3169415147542
Iteration [  292  ]
Obj. val : -8.440799458634721, Avg. Ret : -20.379416382064395
Iteration [  293  ]
Obj. val : -7.985052287835513, Avg. Ret : -16.42125980942724
Iteration [  294  ]
Obj. val : -8.357136321065923, Avg. Ret : -15.183604430659242
Iteration [  295  ]
Obj. val : -8.33250420235503, Avg. Ret : -20.379467592750945
Iteration [  296  ]
Obj. val : -8.129183296741024, Avg. Ret : -15.51674636031256
Iteration [  297  ]
Obj. val : -8.302432474703787, Avg. Ret : -15.58714364606609
Iteration [  298  ]
Obj. val : -8.205845207497958, Avg. Ret : -20.10493262125461
Iteration [  299  ]
Obj. val : -8.187188438883053, Avg. Ret : -15.197850944421587
checkpoint for objective values, iteration: 300. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_4.csv
checkpoint for avg return values, iteration: 300. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_4.csv
Iteration [  300  ]
Obj. val : -8.361122119376438, Avg. Ret : -16.16887932616552
Iteration [  301  ]
Obj. val : -7.980743040821846, Avg. Ret : -20.35564919173482
Iteration [  302  ]
Obj. val : -8.17001827044255, Avg. Ret : -15.375030483518163
Iteration [  303  ]
Obj. val : -8.105207070932718, Avg. Ret : -15.548835105104658
Iteration [  304  ]
Obj. val : -7.966773635379503, Avg. Ret : -20.169369340739443
Iteration [  305  ]
Obj. val : -7.729977001870465, Avg. Ret : -15.41426653111622
Iteration [  306  ]
Obj. val : -7.505941118275846, Avg. Ret : -15.720504633277917
Iteration [  307  ]
Obj. val : -7.7480482852791885, Avg. Ret : -20.035012402181426
Iteration [  308  ]
Obj. val : -7.737469641251845, Avg. Ret : -14.765772992174846
Iteration [  309  ]
Obj. val : -7.9848417115315655, Avg. Ret : -16.011805570379323
Iteration [  310  ]
Obj. val : -7.960031656266348, Avg. Ret : -20.01002992994463
Iteration [  311  ]
Obj. val : -7.545096088854277, Avg. Ret : -15.280520275559189
Iteration [  312  ]
Obj. val : -7.81090118987855, Avg. Ret : -15.398168700847942
Iteration [  313  ]
Obj. val : -7.6697331915137585, Avg. Ret : -19.974421495370823
Iteration [  314  ]
Obj. val : -7.516027573115057, Avg. Ret : -15.843444248786325
Iteration [  315  ]
Obj. val : -7.601517847830411, Avg. Ret : -14.623318828520782
Iteration [  316  ]
Obj. val : -7.363495068535268, Avg. Ret : -19.913263563905854
Iteration [  317  ]
Obj. val : -7.6618769529714505, Avg. Ret : -15.796786288691994
Iteration [  318  ]
Obj. val : -7.451743174420827, Avg. Ret : -14.316380382808656
Iteration [  319  ]
Obj. val : -7.2301225025215725, Avg. Ret : -19.970727341184624
Iteration [  320  ]
Obj. val : -7.374468326077556, Avg. Ret : -13.893226567990563
Iteration [  321  ]
Obj. val : -7.572536811526915, Avg. Ret : -15.949473474006561
Iteration [  322  ]
Obj. val : -7.047684195084021, Avg. Ret : -19.75246163958414
Iteration [  323  ]
Obj. val : -7.2192466642758095, Avg. Ret : -15.01747092839416
Iteration [  324  ]
Obj. val : -7.262932104639605, Avg. Ret : -14.780455701583556
Iteration [  325  ]
Obj. val : -7.066463515638964, Avg. Ret : -19.620110615822473
Iteration [  326  ]
Obj. val : -7.077652913130373, Avg. Ret : -13.652436083904943
Iteration [  327  ]
Obj. val : -7.165159070710201, Avg. Ret : -15.839992906015441
Iteration [  328  ]
Obj. val : -7.38183020542714, Avg. Ret : -19.58820878319464
Iteration [  329  ]
Obj. val : -6.869557853095712, Avg. Ret : -14.753985631263513
Iteration [  330  ]
Obj. val : -7.230315207212233, Avg. Ret : -14.508299863177925
Iteration [  331  ]
Obj. val : -6.805741942112087, Avg. Ret : -19.7549932711708
Iteration [  332  ]
Obj. val : -6.938648927420008, Avg. Ret : -15.79573268357224
Iteration [  333  ]
Obj. val : -7.0458081433325885, Avg. Ret : -13.553795983047797
Iteration [  334  ]
Obj. val : -6.992850155975706, Avg. Ret : -19.565575808586484
Iteration [  335  ]
Obj. val : -7.019170779708437, Avg. Ret : -14.555522767792478
Iteration [  336  ]
Obj. val : -6.897821377662142, Avg. Ret : -14.602879859556092
Iteration [  337  ]
Obj. val : -6.8893132163337345, Avg. Ret : -19.59851567552158
Iteration [  338  ]
Obj. val : -6.700984423430872, Avg. Ret : -14.087208074388148
Iteration [  339  ]
Obj. val : -6.82500430991946, Avg. Ret : -14.511951506865604
Iteration [  340  ]
Obj. val : -6.691691630364239, Avg. Ret : -19.361847576342868
Iteration [  341  ]
Obj. val : -6.4690696550785765, Avg. Ret : -14.845566174142697
Iteration [  342  ]
Obj. val : -6.679533074619696, Avg. Ret : -13.193081095441432
Iteration [  343  ]
Obj. val : -6.9692310632900725, Avg. Ret : -19.428664934813252
Iteration [  344  ]
Obj. val : -6.71492732496137, Avg. Ret : -14.868247003263615
Iteration [  345  ]
Obj. val : -6.639504280023751, Avg. Ret : -13.17326975535058
Iteration [  346  ]
Obj. val : -6.482386362816021, Avg. Ret : -19.498513448397418
Iteration [  347  ]
Obj. val : -6.547776937569023, Avg. Ret : -14.57766885989985
Iteration [  348  ]
Obj. val : -6.406422487731302, Avg. Ret : -13.105703034217031
Iteration [  349  ]
Obj. val : -6.501854253705611, Avg. Ret : -19.106770598585296
Iteration [  350  ]
Obj. val : -6.638706456370065, Avg. Ret : -12.857105171232204
Iteration [  351  ]
Obj. val : -6.487335572920687, Avg. Ret : -14.729963354672064
Iteration [  352  ]
Obj. val : -6.514120218274393, Avg. Ret : -19.3599927091702
Iteration [  353  ]
Obj. val : -6.23069377588396, Avg. Ret : -13.485864617484781
Iteration [  354  ]
Obj. val : -6.728293597689394, Avg. Ret : -13.606223206234652
Iteration [  355  ]
Obj. val : -6.392697984987614, Avg. Ret : -19.320346088085017
Iteration [  356  ]
Obj. val : -6.105914625379335, Avg. Ret : -13.52744323730268
Iteration [  357  ]
Obj. val : -6.307904698084538, Avg. Ret : -13.546731883766281
Iteration [  358  ]
Obj. val : -6.424710394829551, Avg. Ret : -19.22106340674613
Iteration [  359  ]
Obj. val : -6.286557944508169, Avg. Ret : -12.744696980395753
Iteration [  360  ]
Obj. val : -6.190814847910887, Avg. Ret : -14.348756908354597
Iteration [  361  ]
Obj. val : -6.04881368838774, Avg. Ret : -19.10533664311506
Iteration [  362  ]
Obj. val : -6.299921748178563, Avg. Ret : -13.440115512541043
Iteration [  363  ]
Obj. val : -6.199097886217472, Avg. Ret : -13.179296026910299
Iteration [  364  ]
Obj. val : -6.084483829403829, Avg. Ret : -19.2040630418991
Iteration [  365  ]
Obj. val : -5.950141503779721, Avg. Ret : -12.205329207297728
Iteration [  366  ]
Obj. val : -5.981550539679651, Avg. Ret : -14.18736959221356
Iteration [  367  ]
Obj. val : -5.96522112946849, Avg. Ret : -19.078480908453805
Iteration [  368  ]
Obj. val : -5.893732102577069, Avg. Ret : -13.051397001933365
Iteration [  369  ]
Obj. val : -5.661491634139287, Avg. Ret : -13.237790560711503
Iteration [  370  ]
Obj. val : -6.155438819965473, Avg. Ret : -18.91525451951631
Iteration [  371  ]
Obj. val : -5.8842299003863365, Avg. Ret : -12.829849455497264
Iteration [  372  ]
Obj. val : -5.979426000738582, Avg. Ret : -13.183550837574268
Iteration [  373  ]
Obj. val : -6.184893329704155, Avg. Ret : -18.97357296332504
Iteration [  374  ]
Obj. val : -5.87768670369154, Avg. Ret : -12.889933386932972
Iteration [  375  ]
Obj. val : -6.012203063818728, Avg. Ret : -12.994318730368303
Iteration [  376  ]
Obj. val : -5.6861024650557095, Avg. Ret : -18.887526030014847
Iteration [  377  ]
Obj. val : -5.836823923902852, Avg. Ret : -12.699216376486312
Iteration [  378  ]
Obj. val : -5.6385884960543, Avg. Ret : -12.880580940875756
Iteration [  379  ]
Obj. val : -5.705706114076816, Avg. Ret : -18.909800206951246
Iteration [  380  ]
Obj. val : -5.704608573284186, Avg. Ret : -12.100179572339027
Iteration [  381  ]
Obj. val : -5.58564038974195, Avg. Ret : -13.319371370581296
Iteration [  382  ]
Obj. val : -5.708597561484273, Avg. Ret : -18.614832312956857
Iteration [  383  ]
Obj. val : -5.749019494700009, Avg. Ret : -12.62210874341474
Iteration [  384  ]
Obj. val : -5.675484994480353, Avg. Ret : -12.699988311342128
Iteration [  385  ]
Obj. val : -5.2826296793809995, Avg. Ret : -18.581956116045873
Iteration [  386  ]
Obj. val : -5.688983080747858, Avg. Ret : -12.602266186844457
Iteration [  387  ]
Obj. val : -5.660614428374964, Avg. Ret : -12.702325489830443
Iteration [  388  ]
Obj. val : -5.586077623798511, Avg. Ret : -18.47379470872397
Iteration [  389  ]
Obj. val : -5.731161729256214, Avg. Ret : -12.426964052857791
Iteration [  390  ]
Obj. val : -5.504016832310834, Avg. Ret : -12.460082527587165
Iteration [  391  ]
Obj. val : -5.46759775001502, Avg. Ret : -18.51941416669481
Iteration [  392  ]
Obj. val : -5.500918967986821, Avg. Ret : -12.463127026854536
Iteration [  393  ]
Obj. val : -5.403277765629452, Avg. Ret : -12.573292109221972
Iteration [  394  ]
Obj. val : -5.286527659775782, Avg. Ret : -18.55518971835485
Iteration [  395  ]
Obj. val : -5.449416154527157, Avg. Ret : -11.711997329006604
Iteration [  396  ]
Obj. val : -5.544044175117749, Avg. Ret : -13.089896797689555
Iteration [  397  ]
Obj. val : -5.337025505387635, Avg. Ret : -18.367104358483886
Iteration [  398  ]
Obj. val : -5.429899256188958, Avg. Ret : -12.244907322298317
Iteration [  399  ]
Obj. val : -5.385137757361498, Avg. Ret : -12.236610261285362
checkpoint for objective values, iteration: 400. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_4.csv
checkpoint for avg return values, iteration: 400. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_4.csv
Iteration [  400  ]
Obj. val : -5.56120994460901, Avg. Ret : -18.511727977743295
Iteration [  401  ]
Obj. val : -5.531021053681513, Avg. Ret : -12.816778464059407
Iteration [  402  ]
Obj. val : -5.386143505654824, Avg. Ret : -11.447856317412507
Iteration [  403  ]
Obj. val : -5.36710896527296, Avg. Ret : -18.339804996604556
Iteration [  404  ]
Obj. val : -5.19481727377279, Avg. Ret : -12.252280823015813
Iteration [  405  ]
Obj. val : -5.250679853328235, Avg. Ret : -12.205926199436883
Iteration [  406  ]
Obj. val : -5.237529998253213, Avg. Ret : -18.42021379120869
Iteration [  407  ]
Obj. val : -5.352540837514049, Avg. Ret : -12.037357245201227
Iteration [  408  ]
Obj. val : -5.319343723446424, Avg. Ret : -12.101893460661577
Iteration [  409  ]
Obj. val : -5.081117998155413, Avg. Ret : -18.451826931439403
Iteration [  410  ]
Obj. val : -5.1607614779729, Avg. Ret : -12.045654628228931
Iteration [  411  ]
Obj. val : -5.237955943340568, Avg. Ret : -12.064820426810245
Iteration [  412  ]
Obj. val : -5.169150206093287, Avg. Ret : -18.09338612878692
Iteration [  413  ]
Obj. val : -5.218205345112348, Avg. Ret : -11.89655277725321
Iteration [  414  ]
Obj. val : -5.174730702512337, Avg. Ret : -11.92846897716782
Iteration [  415  ]
Obj. val : -5.161562316394966, Avg. Ret : -18.338560140452678
Iteration [  416  ]
Obj. val : -5.016203070317706, Avg. Ret : -11.478716569104295
Iteration [  417  ]
Obj. val : -5.059925402846218, Avg. Ret : -12.267226161444123
Iteration [  418  ]
Obj. val : -5.083937229324148, Avg. Ret : -18.175512227673025
Iteration [  419  ]
Obj. val : -4.833250057348858, Avg. Ret : -11.84868189032409
Iteration [  420  ]
Obj. val : -5.134689433400578, Avg. Ret : -11.92133062820613
Iteration [  421  ]
Obj. val : -5.064582829603893, Avg. Ret : -17.88280107961202
Iteration [  422  ]
Obj. val : -5.087797070273205, Avg. Ret : -11.752375448568047
Iteration [  423  ]
Obj. val : -5.011821159330114, Avg. Ret : -11.825333919312317
Iteration [  424  ]
Obj. val : -4.891290688710801, Avg. Ret : -17.94960384289247
Iteration [  425  ]
Obj. val : -4.980679168543045, Avg. Ret : -11.82289428781832
Iteration [  426  ]
Obj. val : -4.759189764544246, Avg. Ret : -11.700041781805293
Iteration [  427  ]
Obj. val : -4.984122162543658, Avg. Ret : -17.913112925458098
Iteration [  428  ]
Obj. val : -4.719133647496438, Avg. Ret : -11.626982539958226
Iteration [  429  ]
Obj. val : -4.828275033741681, Avg. Ret : -11.719579398402752
Iteration [  430  ]
Obj. val : -4.87405238800357, Avg. Ret : -17.75519936059617
Iteration [  431  ]
Obj. val : -4.901708087108931, Avg. Ret : -11.634873424249047
Iteration [  432  ]
Obj. val : -4.6623874633705045, Avg. Ret : -11.517758258371398
Iteration [  433  ]
Obj. val : -4.897756328552362, Avg. Ret : -17.69424372260232
Iteration [  434  ]
Obj. val : -4.668989355942193, Avg. Ret : -11.563181400363899
Iteration [  435  ]
Obj. val : -4.75139281094432, Avg. Ret : -11.642523800387018
Iteration [  436  ]
Obj. val : -4.784039841712332, Avg. Ret : -17.623941199970893
Iteration [  437  ]
Obj. val : -4.64550634355741, Avg. Ret : -11.950015914491969
Iteration [  438  ]
Obj. val : -4.7279043335675075, Avg. Ret : -11.285052034340906
Iteration [  439  ]
Obj. val : -4.642818276678362, Avg. Ret : -17.57493748158296
Iteration [  440  ]
Obj. val : -4.787323113807986, Avg. Ret : -11.407977891692942
Iteration [  441  ]
Obj. val : -4.587329924941223, Avg. Ret : -11.398845207212513
Iteration [  442  ]
Obj. val : -4.5559792266668016, Avg. Ret : -17.56489619836325
Iteration [  443  ]
Obj. val : -4.626731784170313, Avg. Ret : -11.890102810531243
Iteration [  444  ]
Obj. val : -4.696755435757414, Avg. Ret : -10.772762388088065
Iteration [  445  ]
Obj. val : -4.575373108056704, Avg. Ret : -17.696381837772677
Iteration [  446  ]
Obj. val : -4.545469656671427, Avg. Ret : -10.711890725237758
Iteration [  447  ]
Obj. val : -4.617618224353914, Avg. Ret : -12.00661889781375
Iteration [  448  ]
Obj. val : -4.602047312977426, Avg. Ret : -17.743647782942485
Iteration [  449  ]
Obj. val : -4.538838234074941, Avg. Ret : -11.004957909776774
Iteration [  450  ]
Obj. val : -4.569826101236361, Avg. Ret : -11.345153133914451
Iteration [  451  ]
Obj. val : -4.328007955550001, Avg. Ret : -17.604709987850594
Iteration [  452  ]
Obj. val : -4.6379167217813695, Avg. Ret : -10.511476722017116
Iteration [  453  ]
Obj. val : -4.650430679026274, Avg. Ret : -11.921024115524068
Iteration [  454  ]
Obj. val : -4.526114768642766, Avg. Ret : -17.403785645586378
Iteration [  455  ]
Obj. val : -4.581555209765587, Avg. Ret : -11.049148664667646
Iteration [  456  ]
Obj. val : -4.53578884541832, Avg. Ret : -11.05763074430275
Iteration [  457  ]
Obj. val : -4.2661047234567, Avg. Ret : -17.41100276614493
Iteration [  458  ]
Obj. val : -4.112919299383468, Avg. Ret : -10.820792121394852
Iteration [  459  ]
Obj. val : -4.094760910541573, Avg. Ret : -11.006186689231647
Iteration [  460  ]
Obj. val : -4.289399103520284, Avg. Ret : -17.290584434225547
Iteration [  461  ]
Obj. val : -4.405506664060181, Avg. Ret : -10.450299292401574
Iteration [  462  ]
Obj. val : -4.500501590707696, Avg. Ret : -11.378658098087302
Iteration [  463  ]
Obj. val : -4.421617425442589, Avg. Ret : -17.343300207213144
Iteration [  464  ]
Obj. val : -4.436563800701542, Avg. Ret : -10.7582129570307
Iteration [  465  ]
Obj. val : -4.38161389579439, Avg. Ret : -10.847027147200405
Iteration [  466  ]
Obj. val : -4.442194260362513, Avg. Ret : -17.29710664243702
Iteration [  467  ]
Obj. val : -4.358495747994152, Avg. Ret : -10.945916015044123
Iteration [  468  ]
Obj. val : -4.469841175960889, Avg. Ret : -10.780427826920945
Iteration [  469  ]
Obj. val : -4.3492478354031325, Avg. Ret : -17.1651483820377
Iteration [  470  ]
Obj. val : -4.257930950922415, Avg. Ret : -11.369525216206497
Iteration [  471  ]
Obj. val : -4.286621230338214, Avg. Ret : -10.199422985229052
Iteration [  472  ]
Obj. val : -4.198912967538595, Avg. Ret : -17.039626542025285
Iteration [  473  ]
Obj. val : -4.228920691729519, Avg. Ret : -10.101138354747487
Iteration [  474  ]
Obj. val : -4.308352136340713, Avg. Ret : -11.522366880442364
Iteration [  475  ]
Obj. val : -4.258490069801191, Avg. Ret : -17.077483707275494
Iteration [  476  ]
Obj. val : -4.047644514507701, Avg. Ret : -10.115408887386948
Iteration [  477  ]
Obj. val : -4.3284106563450155, Avg. Ret : -11.211967441593691
Iteration [  478  ]
Obj. val : -3.950205144057646, Avg. Ret : -16.921582572632712
Iteration [  479  ]
Obj. val : -4.296651220639082, Avg. Ret : -10.52755013892193
Iteration [  480  ]
Obj. val : -3.9910740019947366, Avg. Ret : -10.534819331682538
Iteration [  481  ]
Obj. val : -4.045710156531927, Avg. Ret : -16.9545526519665
Iteration [  482  ]
Obj. val : -4.077889270009836, Avg. Ret : -11.062406261416566
Iteration [  483  ]
Obj. val : -3.9667370505323274, Avg. Ret : -9.863577044334084
Iteration [  484  ]
Obj. val : -4.137052541727234, Avg. Ret : -16.996971362688956
Iteration [  485  ]
Obj. val : -4.011113510752843, Avg. Ret : -11.117595045924686
Iteration [  486  ]
Obj. val : -4.205952710877268, Avg. Ret : -9.653063636191323
Iteration [  487  ]
Obj. val : -3.976429581504616, Avg. Ret : -16.68099647730712
Iteration [  488  ]
Obj. val : -4.111219759174825, Avg. Ret : -10.355400122071693
Iteration [  489  ]
Obj. val : -4.130742549602265, Avg. Ret : -10.426862878947619
Iteration [  490  ]
Obj. val : -4.16631364655143, Avg. Ret : -16.836246992863195
Iteration [  491  ]
Obj. val : -4.193245035621064, Avg. Ret : -10.288825839179959
Iteration [  492  ]
Obj. val : -4.153737433843054, Avg. Ret : -10.240505349455143
Iteration [  493  ]
Obj. val : -4.008726143843059, Avg. Ret : -16.705568498084187
Iteration [  494  ]
Obj. val : -3.895743988312669, Avg. Ret : -10.633562188102776
Iteration [  495  ]
Obj. val : -3.9794992235362896, Avg. Ret : -9.533631679457223
Iteration [  496  ]
Obj. val : -4.056816306845508, Avg. Ret : -16.610144883459178
Iteration [  497  ]
Obj. val : -3.966454740965596, Avg. Ret : -10.129084688467517
Iteration [  498  ]
Obj. val : -4.06998614418845, Avg. Ret : -9.955646609111046
Iteration [  499  ]
Obj. val : -3.9844453328186678, Avg. Ret : -16.343814760204438
checkpoint for objective values, iteration: 500. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_4.csv
checkpoint for objective values, iteration: 500. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_4.csv
batch = 5
inside iterator
Iteration [  0  ]
Obj. val : 48.682301833053536, Avg. Ret : -20.272162161363966
Iteration [  1  ]
Obj. val : -22.63315055743134, Avg. Ret : -20.564414252351348
Iteration [  2  ]
Obj. val : -23.17293753433503, Avg. Ret : -20.3022092951478
Iteration [  3  ]
Obj. val : -23.19050245824033, Avg. Ret : -20.2238192730514
Iteration [  4  ]
Obj. val : -23.03214889361076, Avg. Ret : -20.40709887308802
Iteration [  5  ]
Obj. val : -23.19064275672692, Avg. Ret : -20.439464182727903
Iteration [  6  ]
Obj. val : -22.601089007451662, Avg. Ret : -20.304990408717483
Iteration [  7  ]
Obj. val : -22.57741984860749, Avg. Ret : -20.235090247525974
Iteration [  8  ]
Obj. val : -22.462351454161727, Avg. Ret : -20.544001741820622
Iteration [  9  ]
Obj. val : -22.24231126260058, Avg. Ret : -20.542546936813647
Iteration [  10  ]
Obj. val : -22.460970871400633, Avg. Ret : -20.52900993143784
Iteration [  11  ]
Obj. val : -22.349568491570306, Avg. Ret : -20.295090295768166
Iteration [  12  ]
Obj. val : -22.093600767031386, Avg. Ret : -20.174603327566565
Iteration [  13  ]
Obj. val : -22.35943600545993, Avg. Ret : -20.03976804056483
Iteration [  14  ]
Obj. val : -22.295129108245344, Avg. Ret : -20.331236268214187
Iteration [  15  ]
Obj. val : -21.958761295568387, Avg. Ret : -20.18003752728392
Iteration [  16  ]
Obj. val : -21.635233448654745, Avg. Ret : -20.19491504041585
Iteration [  17  ]
Obj. val : -21.512957553410683, Avg. Ret : -20.268998811075697
Iteration [  18  ]
Obj. val : -21.515605345286435, Avg. Ret : -20.169505500927837
Iteration [  19  ]
Obj. val : -22.25071037626135, Avg. Ret : -20.257569893138236
Iteration [  20  ]
Obj. val : -21.946471069344508, Avg. Ret : -33.93157623987374
Iteration [  21  ]
Obj. val : -22.000319325239793, Avg. Ret : -46.07846383244851
Iteration [  22  ]
Obj. val : -21.656018684467377, Avg. Ret : -10.30161993959689
Iteration [  23  ]
Obj. val : -21.41150740071326, Avg. Ret : -33.579251183439794
Iteration [  24  ]
Obj. val : -21.59274940965499, Avg. Ret : -22.07346416209181
Iteration [  25  ]
Obj. val : -21.4708677464563, Avg. Ret : -34.63532407667449
Iteration [  26  ]
Obj. val : -21.460434739529404, Avg. Ret : -12.417969770899932
Iteration [  27  ]
Obj. val : -21.34867266806302, Avg. Ret : -28.329061974980277
Iteration [  28  ]
Obj. val : -21.14039322770166, Avg. Ret : -13.633966995581439
Iteration [  29  ]
Obj. val : -21.108376646215337, Avg. Ret : -27.063708285545108
Iteration [  30  ]
Obj. val : -20.540971255182118, Avg. Ret : -24.91149492137884
Iteration [  31  ]
Obj. val : -21.15252983827721, Avg. Ret : -20.839126941752298
Iteration [  32  ]
Obj. val : -20.880273121960375, Avg. Ret : -20.60970914728172
Iteration [  33  ]
Obj. val : -20.520777288576785, Avg. Ret : -24.57936567405908
Iteration [  34  ]
Obj. val : -20.7509986903591, Avg. Ret : -25.311173002178524
Iteration [  35  ]
Obj. val : -20.453339359623204, Avg. Ret : -15.875067077214736
Iteration [  36  ]
Obj. val : -20.103675595337325, Avg. Ret : -20.341500813249397
Iteration [  37  ]
Obj. val : -20.434961912776235, Avg. Ret : -22.83893924628792
Iteration [  38  ]
Obj. val : -20.19550954076835, Avg. Ret : -16.656609122614448
Iteration [  39  ]
Obj. val : -20.325869417132445, Avg. Ret : -23.905828737241762
Iteration [  40  ]
Obj. val : -20.289447988313828, Avg. Ret : -22.65849655214125
Iteration [  41  ]
Obj. val : 51.8371408205396, Avg. Ret : -19.552150541854175
Iteration [  42  ]
Obj. val : -20.249029806322064, Avg. Ret : -20.23587271856062
Iteration [  43  ]
Obj. val : -20.479534048582646, Avg. Ret : -24.785814074393805
Iteration [  44  ]
Obj. val : -20.03325304759684, Avg. Ret : -20.068900048648743
Iteration [  45  ]
Obj. val : -20.007069939412283, Avg. Ret : -20.132914954734858
Iteration [  46  ]
Obj. val : -20.256518225048595, Avg. Ret : -24.677001075353363
Iteration [  47  ]
Obj. val : -19.948230934096436, Avg. Ret : -19.621755252185935
Iteration [  48  ]
Obj. val : -19.5472709507636, Avg. Ret : -20.424400752986852
Iteration [  49  ]
Obj. val : -19.299838555038697, Avg. Ret : -24.45780613224599
Iteration [  50  ]
Obj. val : -19.470705715893043, Avg. Ret : -19.895615850127317
Iteration [  51  ]
Obj. val : -19.488544894569706, Avg. Ret : -19.74402355286034
Iteration [  52  ]
Obj. val : -19.421346701138983, Avg. Ret : -24.55741280326746
Iteration [  53  ]
Obj. val : -18.859276794988816, Avg. Ret : -20.115957719321933
Iteration [  54  ]
Obj. val : -18.54933648390846, Avg. Ret : -19.353892950685008
Iteration [  55  ]
Obj. val : -19.392990391794754, Avg. Ret : -24.33426260578514
Iteration [  56  ]
Obj. val : -19.17104740195437, Avg. Ret : -19.66600326295542
Iteration [  57  ]
Obj. val : -18.90111473183946, Avg. Ret : -19.44812303879438
Iteration [  58  ]
Obj. val : -18.590809951072572, Avg. Ret : -24.36274184530285
Iteration [  59  ]
Obj. val : -18.84560318537459, Avg. Ret : -19.130652660978775
Iteration [  60  ]
Obj. val : -18.802933758438215, Avg. Ret : -19.89578220831412
Iteration [  61  ]
Obj. val : -18.377241135263652, Avg. Ret : -24.123940090084343
Iteration [  62  ]
Obj. val : -18.429024188677086, Avg. Ret : -19.890920674571074
Iteration [  63  ]
Obj. val : -18.347065378261455, Avg. Ret : -18.715476323421353
Iteration [  64  ]
Obj. val : -18.354435832871324, Avg. Ret : -24.24530231870187
Iteration [  65  ]
Obj. val : -17.93432078247178, Avg. Ret : -18.68966831586077
Iteration [  66  ]
Obj. val : -17.919306799884126, Avg. Ret : -19.902699351447126
Iteration [  67  ]
Obj. val : -17.821417202497045, Avg. Ret : -24.36708864455262
Iteration [  68  ]
Obj. val : -17.394950146638617, Avg. Ret : -18.426433805863574
Iteration [  69  ]
Obj. val : -17.6914143396897, Avg. Ret : -19.64485550839753
Iteration [  70  ]
Obj. val : -17.652365134485382, Avg. Ret : -24.074434447843103
Iteration [  71  ]
Obj. val : -17.714769138839962, Avg. Ret : -19.230108821922837
Iteration [  72  ]
Obj. val : -17.844339802427456, Avg. Ret : -18.844524220761844
Iteration [  73  ]
Obj. val : -18.124034120054013, Avg. Ret : -23.993874586190085
Iteration [  74  ]
Obj. val : -17.497712488898767, Avg. Ret : -18.938993253656573
Iteration [  75  ]
Obj. val : -17.403302742258948, Avg. Ret : -18.565276990168503
Iteration [  76  ]
Obj. val : -17.461046833992242, Avg. Ret : -23.753316587887138
Iteration [  77  ]
Obj. val : -17.411563073393395, Avg. Ret : -18.4416387844967
Iteration [  78  ]
Obj. val : -17.349703812889608, Avg. Ret : -18.76276441296675
Iteration [  79  ]
Obj. val : -16.517677983009342, Avg. Ret : -23.75248294534871
Iteration [  80  ]
Obj. val : -17.027182798414422, Avg. Ret : -17.779878167216758
Iteration [  81  ]
Obj. val : -17.129772313231292, Avg. Ret : -19.168075287553982
Iteration [  82  ]
Obj. val : -16.98749763258707, Avg. Ret : -23.82588828166407
Iteration [  83  ]
Obj. val : -16.650496697471077, Avg. Ret : -18.901411920981406
Iteration [  84  ]
Obj. val : -17.291927090897804, Avg. Ret : -17.850302621874427
Iteration [  85  ]
Obj. val : -16.512082842866572, Avg. Ret : -23.909795463170955
Iteration [  86  ]
Obj. val : -16.554690580619003, Avg. Ret : -18.13185282631887
Iteration [  87  ]
Obj. val : -16.755250975936743, Avg. Ret : -17.98041173366333
Iteration [  88  ]
Obj. val : -16.40764584701603, Avg. Ret : -23.686789990137484
Iteration [  89  ]
Obj. val : -16.5643512003218, Avg. Ret : -18.36982138886961
Iteration [  90  ]
Obj. val : -16.819118245730614, Avg. Ret : -18.234468308742173
Iteration [  91  ]
Obj. val : -16.414265785556804, Avg. Ret : -23.549489403199637
Iteration [  92  ]
Obj. val : -16.835351297880525, Avg. Ret : -18.43278458666468
Iteration [  93  ]
Obj. val : -16.185771391463376, Avg. Ret : -17.463239251828853
Iteration [  94  ]
Obj. val : -15.863372372453409, Avg. Ret : -23.541558477504022
Iteration [  95  ]
Obj. val : -15.878504537497527, Avg. Ret : -17.886075786133564
Iteration [  96  ]
Obj. val : -15.886378284453569, Avg. Ret : -17.672225530972895
Iteration [  97  ]
Obj. val : -16.029274930215486, Avg. Ret : -23.5104672427358
Iteration [  98  ]
Obj. val : -15.80564251614577, Avg. Ret : -17.955603991693064
Iteration [  99  ]
Obj. val : -15.7928377222075, Avg. Ret : -17.524016759426075
checkpoint for objective values, iteration: 100. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_5.csv
checkpoint for avg return values, iteration: 100. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_5.csv
Iteration [  100  ]
Obj. val : -15.91025700240765, Avg. Ret : -23.44654146578614
Iteration [  101  ]
Obj. val : -15.79194010252747, Avg. Ret : -17.86722634248059
Iteration [  102  ]
Obj. val : -15.863967646767142, Avg. Ret : -17.35230187185424
Iteration [  103  ]
Obj. val : -15.735404774033036, Avg. Ret : -23.288775551305125
Iteration [  104  ]
Obj. val : -15.049055524151322, Avg. Ret : -18.214014771752183
Iteration [  105  ]
Obj. val : -15.62674154936471, Avg. Ret : -16.750464463025214
Iteration [  106  ]
Obj. val : -15.140155903167914, Avg. Ret : -23.15522577816955
Iteration [  107  ]
Obj. val : -15.645397365189611, Avg. Ret : -17.401039329513488
Iteration [  108  ]
Obj. val : -15.215777430192986, Avg. Ret : -17.531261382931845
Iteration [  109  ]
Obj. val : -15.24274144133482, Avg. Ret : -23.039529369804892
Iteration [  110  ]
Obj. val : -15.045618353136064, Avg. Ret : -17.889703219426806
Iteration [  111  ]
Obj. val : -15.165946294607128, Avg. Ret : -16.551692600022434
Iteration [  112  ]
Obj. val : -14.832158789941388, Avg. Ret : -23.251387278237218
Iteration [  113  ]
Obj. val : -14.886276320547738, Avg. Ret : -16.366917071299635
Iteration [  114  ]
Obj. val : -14.716428934584629, Avg. Ret : -17.664955543894788
Iteration [  115  ]
Obj. val : -14.357727681841208, Avg. Ret : -23.0149265849561
Iteration [  116  ]
Obj. val : -15.13586286325157, Avg. Ret : -16.32624597545552
Iteration [  117  ]
Obj. val : -15.037367644379318, Avg. Ret : -17.514026656810255
Iteration [  118  ]
Obj. val : -15.033059756755284, Avg. Ret : -22.772450403895405
Iteration [  119  ]
Obj. val : -14.794275771697004, Avg. Ret : -16.930181960892206
Iteration [  120  ]
Obj. val : -14.428131847332198, Avg. Ret : -17.073966549637674
Iteration [  121  ]
Obj. val : -14.5328129868825, Avg. Ret : -22.76090868671465
Iteration [  122  ]
Obj. val : -13.946187546569618, Avg. Ret : -17.074548393597457
Iteration [  123  ]
Obj. val : -13.914424698588464, Avg. Ret : -16.762189328540387
Iteration [  124  ]
Obj. val : -14.597650572516816, Avg. Ret : -22.81826889667371
Iteration [  125  ]
Obj. val : -14.362027807635522, Avg. Ret : -15.987634485242122
Iteration [  126  ]
Obj. val : -14.190550233158655, Avg. Ret : -17.116276015120544
Iteration [  127  ]
Obj. val : -14.276116053884959, Avg. Ret : -22.664711752227117
Iteration [  128  ]
Obj. val : -14.021992805161501, Avg. Ret : -17.15980247133135
Iteration [  129  ]
Obj. val : -13.915255253915777, Avg. Ret : -16.034039746842303
Iteration [  130  ]
Obj. val : -13.767575802784142, Avg. Ret : -22.531241233343795
Iteration [  131  ]
Obj. val : -13.890184139553757, Avg. Ret : -15.819514107467173
Iteration [  132  ]
Obj. val : -13.50890037905997, Avg. Ret : -17.193368540343112
Iteration [  133  ]
Obj. val : -13.870322618250041, Avg. Ret : -22.601740807205015
Iteration [  134  ]
Obj. val : -13.97044301433559, Avg. Ret : -16.524926205077495
Iteration [  135  ]
Obj. val : -13.520019418033021, Avg. Ret : -16.540066262794063
Iteration [  136  ]
Obj. val : -13.495648982035025, Avg. Ret : -22.340868859379334
Iteration [  137  ]
Obj. val : -13.758496713382579, Avg. Ret : -16.07381253698159
Iteration [  138  ]
Obj. val : -13.601857330096434, Avg. Ret : -15.932934204580311
Iteration [  139  ]
Obj. val : -13.669630622685686, Avg. Ret : -22.307390156337522
Iteration [  140  ]
Obj. val : -13.342023622087432, Avg. Ret : -15.566107792091852
Iteration [  141  ]
Obj. val : -13.471738477036654, Avg. Ret : -16.682075162146035
Iteration [  142  ]
Obj. val : -13.275542667020408, Avg. Ret : -22.244730236909348
Iteration [  143  ]
Obj. val : -13.556012642557404, Avg. Ret : -16.069952460432926
Iteration [  144  ]
Obj. val : -13.10283176758344, Avg. Ret : -16.120037112096597
Iteration [  145  ]
Obj. val : -13.001465368105208, Avg. Ret : -22.1453248143386
Iteration [  146  ]
Obj. val : -13.085075539837103, Avg. Ret : -15.789143406658315
Iteration [  147  ]
Obj. val : -12.96893768056029, Avg. Ret : -16.034822104200906
Iteration [  148  ]
Obj. val : -12.953556027822994, Avg. Ret : -22.079106664722236
Iteration [  149  ]
Obj. val : -12.794661850929364, Avg. Ret : -15.641044217781573
Iteration [  150  ]
Obj. val : -12.774868989966505, Avg. Ret : -16.258709332820153
Iteration [  151  ]
Obj. val : -12.79882199522997, Avg. Ret : -22.040943220973812
Iteration [  152  ]
Obj. val : -12.96325608940138, Avg. Ret : -15.580508220708474
Iteration [  153  ]
Obj. val : -12.663967266534401, Avg. Ret : -15.731455776356256
Iteration [  154  ]
Obj. val : -12.537463416816353, Avg. Ret : -21.950216907462682
Iteration [  155  ]
Obj. val : -12.517443744231464, Avg. Ret : -16.284265923759534
Iteration [  156  ]
Obj. val : -12.636393021979622, Avg. Ret : -15.433167027626892
Iteration [  157  ]
Obj. val : -12.678832959814216, Avg. Ret : -21.8446859919507
Iteration [  158  ]
Obj. val : -12.619722341073533, Avg. Ret : -14.933094953756484
Iteration [  159  ]
Obj. val : -12.612356773644908, Avg. Ret : -16.214614386014325
Iteration [  160  ]
Obj. val : -12.58414795164298, Avg. Ret : -21.764248507662355
Iteration [  161  ]
Obj. val : -12.220197103239643, Avg. Ret : -15.41884290984555
Iteration [  162  ]
Obj. val : -11.766114970333785, Avg. Ret : -15.37105608626014
Iteration [  163  ]
Obj. val : -12.337662217439162, Avg. Ret : -19.661889780094032
Iteration [  164  ]
Obj. val : -11.994964368085656, Avg. Ret : -14.68709619815393
Iteration [  165  ]
Obj. val : -12.417229354287791, Avg. Ret : -16.047501392133736
Iteration [  166  ]
Obj. val : -12.392089106612897, Avg. Ret : -21.51906632289159
Iteration [  167  ]
Obj. val : -11.77687979290409, Avg. Ret : -15.199124033113907
Iteration [  168  ]
Obj. val : -12.16583960251167, Avg. Ret : -15.368087329317994
Iteration [  169  ]
Obj. val : -11.886690135394172, Avg. Ret : -21.7602405211282
Iteration [  170  ]
Obj. val : -11.603522359278708, Avg. Ret : -14.547082388808123
Iteration [  171  ]
Obj. val : -11.52432482622201, Avg. Ret : -15.868090518661642
Iteration [  172  ]
Obj. val : -11.296132742037607, Avg. Ret : -21.50496346212642
Iteration [  173  ]
Obj. val : -11.636502636801486, Avg. Ret : -14.735354530599528
Iteration [  174  ]
Obj. val : -11.757266584603409, Avg. Ret : -15.67873935300293
Iteration [  175  ]
Obj. val : -11.861498948299886, Avg. Ret : -21.415885614777157
Iteration [  176  ]
Obj. val : -11.154634398355764, Avg. Ret : -15.12586658109563
Iteration [  177  ]
Obj. val : -11.53371834102336, Avg. Ret : -15.037650481427503
Iteration [  178  ]
Obj. val : -11.329955795798703, Avg. Ret : -21.534779933178328
Iteration [  179  ]
Obj. val : -11.30977887573974, Avg. Ret : -14.879309268059988
Iteration [  180  ]
Obj. val : -11.2164401156546, Avg. Ret : -15.138073755707067
Iteration [  181  ]
Obj. val : -10.829385565855949, Avg. Ret : -21.235719442910554
Iteration [  182  ]
Obj. val : -11.034108717373899, Avg. Ret : -15.328617167018347
Iteration [  183  ]
Obj. val : -11.550362936240106, Avg. Ret : -14.124037780068884
Iteration [  184  ]
Obj. val : -10.975441615932827, Avg. Ret : -21.17469958649185
Iteration [  185  ]
Obj. val : -11.137573706962904, Avg. Ret : -15.170420088943036
Iteration [  186  ]
Obj. val : -10.744520141074691, Avg. Ret : -14.05920699363128
Iteration [  187  ]
Obj. val : -10.867017480692159, Avg. Ret : -20.98323665129651
Iteration [  188  ]
Obj. val : -11.203426952091501, Avg. Ret : -14.12072101104686
Iteration [  189  ]
Obj. val : -10.83868392429371, Avg. Ret : -15.035383269011383
Iteration [  190  ]
Obj. val : -10.633665424644088, Avg. Ret : -21.045451055453217
Iteration [  191  ]
Obj. val : -11.125355225194241, Avg. Ret : -14.736505575210312
Iteration [  192  ]
Obj. val : -11.152388258077945, Avg. Ret : -14.454321957497662
Iteration [  193  ]
Obj. val : -11.010580170440752, Avg. Ret : -20.854542871709
Iteration [  194  ]
Obj. val : -11.172175569935577, Avg. Ret : -14.36161187664262
Iteration [  195  ]
Obj. val : -10.956576510402476, Avg. Ret : -14.350346800326164
Iteration [  196  ]
Obj. val : -10.766544096154341, Avg. Ret : -20.699832363432964
Iteration [  197  ]
Obj. val : -10.49123022459068, Avg. Ret : -14.831532128700433
Iteration [  198  ]
Obj. val : -10.325692686413408, Avg. Ret : -13.769563579314484
Iteration [  199  ]
Obj. val : -10.101600856344026, Avg. Ret : -20.54863513137133
checkpoint for objective values, iteration: 200. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_5.csv
checkpoint for avg return values, iteration: 200. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_5.csv
Iteration [  200  ]
Obj. val : -10.430271360413034, Avg. Ret : -14.176873666593004
Iteration [  201  ]
Obj. val : -10.832120215031713, Avg. Ret : -14.162320217856532
Iteration [  202  ]
Obj. val : -10.133253639350247, Avg. Ret : -20.546133043237365
Iteration [  203  ]
Obj. val : -10.31252886692712, Avg. Ret : -14.663270607198434
Iteration [  204  ]
Obj. val : -10.660514713057621, Avg. Ret : -13.556471464804304
Iteration [  205  ]
Obj. val : -10.729589986296908, Avg. Ret : -20.63673408845052
Iteration [  206  ]
Obj. val : -10.350513473909755, Avg. Ret : -13.987942997090409
Iteration [  207  ]
Obj. val : -10.257539187678672, Avg. Ret : -14.100316942899886
Iteration [  208  ]
Obj. val : -9.929428865920942, Avg. Ret : -20.394591163661502
Iteration [  209  ]
Obj. val : -10.131748234746826, Avg. Ret : -14.298315653281334
Iteration [  210  ]
Obj. val : -10.369956366960547, Avg. Ret : -13.951778409798203
Iteration [  211  ]
Obj. val : -10.04458986284461, Avg. Ret : -20.52295203686268
Iteration [  212  ]
Obj. val : -9.665665966081578, Avg. Ret : -13.687482847934055
Iteration [  213  ]
Obj. val : -10.18772560742281, Avg. Ret : -14.450587871718719
Iteration [  214  ]
Obj. val : -9.969153630429666, Avg. Ret : -20.41646671309348
Iteration [  215  ]
Obj. val : -9.603267821034928, Avg. Ret : -13.474474886498037
Iteration [  216  ]
Obj. val : -9.928031735086595, Avg. Ret : -14.3448452357029
Iteration [  217  ]
Obj. val : -9.88998010106886, Avg. Ret : -20.13209563922675
Iteration [  218  ]
Obj. val : -9.856279191547129, Avg. Ret : -13.401570069608606
Iteration [  219  ]
Obj. val : -9.668763247370828, Avg. Ret : -14.46868471806042
Iteration [  220  ]
Obj. val : -9.539847502904982, Avg. Ret : -20.245065677065632
Iteration [  221  ]
Obj. val : -9.704395846717498, Avg. Ret : -14.150464749517859
Iteration [  222  ]
Obj. val : -9.619356788654075, Avg. Ret : -13.287478412740063
Iteration [  223  ]
Obj. val : -9.530141239728922, Avg. Ret : -20.201814650970654
Iteration [  224  ]
Obj. val : -9.92730448833675, Avg. Ret : -14.107361949343776
Iteration [  225  ]
Obj. val : -9.836431407676624, Avg. Ret : -12.85936931585426
Iteration [  226  ]
Obj. val : -9.267108026721147, Avg. Ret : -20.126911733743405
Iteration [  227  ]
Obj. val : -9.750865922812725, Avg. Ret : -12.705326373738638
Iteration [  228  ]
Obj. val : -8.68072743285909, Avg. Ret : -14.024390454541244
Iteration [  229  ]
Obj. val : -9.151851434823016, Avg. Ret : -20.075397074154086
Iteration [  230  ]
Obj. val : -9.429126576075689, Avg. Ret : -12.764236525566561
Iteration [  231  ]
Obj. val : -9.72061353707267, Avg. Ret : -13.832941544902162
Iteration [  232  ]
Obj. val : -9.343395548895344, Avg. Ret : -19.69001165451352
Iteration [  233  ]
Obj. val : -9.443063895743572, Avg. Ret : -13.143267047239817
Iteration [  234  ]
Obj. val : -9.493675225946347, Avg. Ret : -13.338223650357712
Iteration [  235  ]
Obj. val : -9.317426023306618, Avg. Ret : -19.670700228548522
Iteration [  236  ]
Obj. val : -9.156383946818641, Avg. Ret : -13.686176639018635
Iteration [  237  ]
Obj. val : -8.922532710357054, Avg. Ret : -12.609724377372004
Iteration [  238  ]
Obj. val : -9.194548178394385, Avg. Ret : -19.641219362277855
Iteration [  239  ]
Obj. val : -9.050576570585225, Avg. Ret : -12.313295362190695
Iteration [  240  ]
Obj. val : -8.964366966254786, Avg. Ret : -13.53649730912165
Iteration [  241  ]
Obj. val : -8.880469058607364, Avg. Ret : -19.703864989915182
Iteration [  242  ]
Obj. val : -8.796578862094538, Avg. Ret : -12.89269989072595
Iteration [  243  ]
Obj. val : -8.919193342380314, Avg. Ret : -12.642054914759164
Iteration [  244  ]
Obj. val : -9.054348433669333, Avg. Ret : -19.70156450317625
Iteration [  245  ]
Obj. val : -8.963335742707107, Avg. Ret : -12.050576650864821
Iteration [  246  ]
Obj. val : -8.571156053445762, Avg. Ret : -13.3374231375799
Iteration [  247  ]
Obj. val : -8.956149647957984, Avg. Ret : -19.44417911843418
Iteration [  248  ]
Obj. val : -8.48004491691137, Avg. Ret : -12.209272417226321
Iteration [  249  ]
Obj. val : -8.495579694102036, Avg. Ret : -13.38246620516647
Iteration [  250  ]
Obj. val : -8.506298001913079, Avg. Ret : -19.365181152909976
Iteration [  251  ]
Obj. val : -8.575553974943722, Avg. Ret : -12.711165841177882
Iteration [  252  ]
Obj. val : -8.742074764900222, Avg. Ret : -12.383486053450797
Iteration [  253  ]
Obj. val : -8.421668573187493, Avg. Ret : -19.26041393086772
Iteration [  254  ]
Obj. val : -8.531016382306944, Avg. Ret : -12.594631163008112
Iteration [  255  ]
Obj. val : -8.801957560524093, Avg. Ret : -12.456840899394752
Iteration [  256  ]
Obj. val : -8.434455313754935, Avg. Ret : -19.198481715902133
Iteration [  257  ]
Obj. val : -8.314541251781725, Avg. Ret : -12.273413897737475
Iteration [  258  ]
Obj. val : -8.462092653633627, Avg. Ret : -12.476438740108826
Iteration [  259  ]
Obj. val : -8.561040961255745, Avg. Ret : -19.498087028405187
Iteration [  260  ]
Obj. val : -7.92872116123178, Avg. Ret : -11.635107965667062
Iteration [  261  ]
Obj. val : -8.429499731831497, Avg. Ret : -12.815632991934216
Iteration [  262  ]
Obj. val : -8.408278234146643, Avg. Ret : -19.08493544543265
Iteration [  263  ]
Obj. val : -8.451211424794066, Avg. Ret : -12.174511544333138
Iteration [  264  ]
Obj. val : -8.196096475826124, Avg. Ret : -11.971250057749751
Iteration [  265  ]
Obj. val : -8.38239140323312, Avg. Ret : -19.02970009123192
Iteration [  266  ]
Obj. val : -8.121289764374922, Avg. Ret : -11.983407834571533
Iteration [  267  ]
Obj. val : -7.744340259522016, Avg. Ret : -12.024424739638516
Iteration [  268  ]
Obj. val : -7.976455887739972, Avg. Ret : -18.75326103428632
Iteration [  269  ]
Obj. val : -8.318248333710955, Avg. Ret : -12.484350035283121
Iteration [  270  ]
Obj. val : -8.032738518456526, Avg. Ret : -11.485465220607718
Iteration [  271  ]
Obj. val : -8.087205006400863, Avg. Ret : -18.80017376318237
Iteration [  272  ]
Obj. val : -8.013135476024532, Avg. Ret : -11.567985186560783
Iteration [  273  ]
Obj. val : -7.568686597781018, Avg. Ret : -12.217911393111072
Iteration [  274  ]
Obj. val : -7.932698915538266, Avg. Ret : -18.782098790714187
Iteration [  275  ]
Obj. val : -7.846007733000691, Avg. Ret : -11.715278762308536
Iteration [  276  ]
Obj. val : -7.621814894510618, Avg. Ret : -11.831650870169067
Iteration [  277  ]
Obj. val : -7.7023285534736345, Avg. Ret : -18.707438658229695
Iteration [  278  ]
Obj. val : -7.854840580706574, Avg. Ret : -12.225966113457801
Iteration [  279  ]
Obj. val : -7.904906994827749, Avg. Ret : -11.169989823676424
Iteration [  280  ]
Obj. val : -7.836578029115668, Avg. Ret : -18.558942986223702
Iteration [  281  ]
Obj. val : -7.943713288602547, Avg. Ret : -11.648622549485024
Iteration [  282  ]
Obj. val : -7.917394716176657, Avg. Ret : -11.598337270626645
Iteration [  283  ]
Obj. val : -7.425893376276004, Avg. Ret : -18.57013594096517
Iteration [  284  ]
Obj. val : -7.784303152196856, Avg. Ret : -11.550897646000553
Iteration [  285  ]
Obj. val : -7.653699692052483, Avg. Ret : -11.457808227499113
Iteration [  286  ]
Obj. val : -7.482797108192395, Avg. Ret : -18.558095576341444
Iteration [  287  ]
Obj. val : -7.653863196157444, Avg. Ret : -11.019500774879297
Iteration [  288  ]
Obj. val : -7.016451476354322, Avg. Ret : -11.875047150953522
Iteration [  289  ]
Obj. val : -7.584008314514026, Avg. Ret : -18.264499862718623
Iteration [  290  ]
Obj. val : -7.580806955950884, Avg. Ret : -11.506647249301906
Iteration [  291  ]
Obj. val : -7.646138854495501, Avg. Ret : -11.302983278663799
Iteration [  292  ]
Obj. val : -7.387270272771875, Avg. Ret : -18.483871470516142
Iteration [  293  ]
Obj. val : -7.293517571862326, Avg. Ret : -11.285347091514753
Iteration [  294  ]
Obj. val : -7.390343382106758, Avg. Ret : -11.422484540072317
Iteration [  295  ]
Obj. val : -7.480611675683075, Avg. Ret : -18.403475551030763
Iteration [  296  ]
Obj. val : -7.3155961846613575, Avg. Ret : -11.110859743612217
Iteration [  297  ]
Obj. val : -7.358880684583447, Avg. Ret : -11.630101754522709
Iteration [  298  ]
Obj. val : -7.3247384124300945, Avg. Ret : -18.161770360463887
Iteration [  299  ]
Obj. val : -7.1612053449736965, Avg. Ret : -11.15524019580992
checkpoint for objective values, iteration: 300. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_5.csv
checkpoint for avg return values, iteration: 300. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_5.csv
Iteration [  300  ]
Obj. val : -7.234690364735716, Avg. Ret : -11.218796202770962
Iteration [  301  ]
Obj. val : -7.290810920693154, Avg. Ret : -18.094005774578278
Iteration [  302  ]
Obj. val : -7.310376615488325, Avg. Ret : -10.885304080647677
Iteration [  303  ]
Obj. val : -7.139083612109794, Avg. Ret : -11.384671971676156
Iteration [  304  ]
Obj. val : -7.110776098811783, Avg. Ret : -18.02597948926433
Iteration [  305  ]
Obj. val : -7.417157756743817, Avg. Ret : -11.079507493340202
Iteration [  306  ]
Obj. val : -7.407178745482028, Avg. Ret : -11.179058672428248
Iteration [  307  ]
Obj. val : -7.063113838330077, Avg. Ret : -17.835160693904232
Iteration [  308  ]
Obj. val : -6.973663836368607, Avg. Ret : -10.791497874124184
Iteration [  309  ]
Obj. val : -6.601978199785613, Avg. Ret : -11.256021192229039
Iteration [  310  ]
Obj. val : -7.202027642508867, Avg. Ret : -18.106115471826858
Iteration [  311  ]
Obj. val : -6.8672437241404065, Avg. Ret : -10.914451892284573
Iteration [  312  ]
Obj. val : -6.806857120520128, Avg. Ret : -11.06736037979553
Iteration [  313  ]
Obj. val : -7.06602987993614, Avg. Ret : -17.864149538605158
Iteration [  314  ]
Obj. val : -6.767409787863058, Avg. Ret : -10.920012703976042
Iteration [  315  ]
Obj. val : -7.039309789931798, Avg. Ret : -10.92040644502965
Iteration [  316  ]
Obj. val : -6.908585366111203, Avg. Ret : -18.135612047626882
Iteration [  317  ]
Obj. val : -6.774382314545899, Avg. Ret : -11.188934454792147
Iteration [  318  ]
Obj. val : -6.895416731874392, Avg. Ret : -10.720045674704409
Iteration [  319  ]
Obj. val : -6.765672440856192, Avg. Ret : -17.71638493035921
Iteration [  320  ]
Obj. val : -6.964161511198396, Avg. Ret : -11.147312929459204
Iteration [  321  ]
Obj. val : -6.804432060356613, Avg. Ret : -10.640113610371374
Iteration [  322  ]
Obj. val : -6.951807924175061, Avg. Ret : -17.543509847806842
Iteration [  323  ]
Obj. val : -6.83449823393233, Avg. Ret : -10.808072331094227
Iteration [  324  ]
Obj. val : -6.8934846062036925, Avg. Ret : -10.841904078975325
Iteration [  325  ]
Obj. val : -6.798615055935232, Avg. Ret : -17.507149304452437
Iteration [  326  ]
Obj. val : -6.690396347375611, Avg. Ret : -10.908241860274035
Iteration [  327  ]
Obj. val : -6.78868967896525, Avg. Ret : -10.396048028628863
Iteration [  328  ]
Obj. val : -6.710159602588397, Avg. Ret : -17.356743166828906
Iteration [  329  ]
Obj. val : -6.491053084248663, Avg. Ret : -10.345656029101603
Iteration [  330  ]
Obj. val : -6.630976134688372, Avg. Ret : -10.94886539232437
Iteration [  331  ]
Obj. val : -6.830809936916946, Avg. Ret : -17.553381095663045
Iteration [  332  ]
Obj. val : -6.569499119304751, Avg. Ret : -10.59638094391328
Iteration [  333  ]
Obj. val : -6.519589279576181, Avg. Ret : -10.473253127701097
Iteration [  334  ]
Obj. val : -6.717044904513818, Avg. Ret : -17.56874127971815
Iteration [  335  ]
Obj. val : -6.677167402281358, Avg. Ret : -10.52697669614757
Iteration [  336  ]
Obj. val : -6.40823680679303, Avg. Ret : -10.494815918376819
Iteration [  337  ]
Obj. val : -6.375480391781949, Avg. Ret : -17.395611930290013
Iteration [  338  ]
Obj. val : -6.392508035269456, Avg. Ret : -10.556439382620283
Iteration [  339  ]
Obj. val : -6.627772245002015, Avg. Ret : -10.422998799690065
Iteration [  340  ]
Obj. val : -6.428983041551804, Avg. Ret : -17.13223235079115
Iteration [  341  ]
Obj. val : -6.512349680584877, Avg. Ret : -10.04926067967218
Iteration [  342  ]
Obj. val : -6.274035762379935, Avg. Ret : -10.875484901279915
Iteration [  343  ]
Obj. val : -6.4680175851401875, Avg. Ret : -17.1995400779546
Iteration [  344  ]
Obj. val : -6.463710213828871, Avg. Ret : -10.350311471848856
Iteration [  345  ]
Obj. val : -6.492547158722684, Avg. Ret : -10.554489148899837
Iteration [  346  ]
Obj. val : -6.352958502216297, Avg. Ret : -17.11582385412777
Iteration [  347  ]
Obj. val : -6.4285802486720725, Avg. Ret : -9.89118494990947
Iteration [  348  ]
Obj. val : -6.53485096016678, Avg. Ret : -10.851395539441299
Iteration [  349  ]
Obj. val : -6.1840246607127565, Avg. Ret : -17.023306489239463
Iteration [  350  ]
Obj. val : -6.166980769551015, Avg. Ret : -10.23524745784709
Iteration [  351  ]
Obj. val : -6.0443463894389735, Avg. Ret : -10.364561368166633
Iteration [  352  ]
Obj. val : -6.268617840405465, Avg. Ret : -16.796722732633356
Iteration [  353  ]
Obj. val : -6.376722291047383, Avg. Ret : -10.65579451895666
Iteration [  354  ]
Obj. val : -6.259886283315559, Avg. Ret : -9.711692477998426
Iteration [  355  ]
Obj. val : -6.3039333296489435, Avg. Ret : -17.011285380542052
Iteration [  356  ]
Obj. val : -6.000635571029532, Avg. Ret : -10.256687072740402
Iteration [  357  ]
Obj. val : -6.14315784928546, Avg. Ret : -10.197434918061724
Iteration [  358  ]
Obj. val : -6.09056159677229, Avg. Ret : -16.606780566484392
Iteration [  359  ]
Obj. val : -6.050041963189306, Avg. Ret : -10.09567198218533
Iteration [  360  ]
Obj. val : -5.932659247615715, Avg. Ret : -9.990207145377019
Iteration [  361  ]
Obj. val : -6.299495458987489, Avg. Ret : -16.86759367742098
Iteration [  362  ]
Obj. val : -6.1252666797983, Avg. Ret : -10.194366448816748
Iteration [  363  ]
Obj. val : -6.23838500780402, Avg. Ret : -10.215171271458948
Iteration [  364  ]
Obj. val : -6.10822197128806, Avg. Ret : -16.718804667226678
Iteration [  365  ]
Obj. val : -6.095903377760002, Avg. Ret : -9.74786544556742
Iteration [  366  ]
Obj. val : -5.9649106693206715, Avg. Ret : -10.416170577922369
Iteration [  367  ]
Obj. val : -5.92228375811551, Avg. Ret : -16.681926275981947
Iteration [  368  ]
Obj. val : -5.851045670116415, Avg. Ret : -10.20474169800553
Iteration [  369  ]
Obj. val : -5.91071238669091, Avg. Ret : -9.877390323405992
Iteration [  370  ]
Obj. val : -5.9899593995845795, Avg. Ret : -16.5603838761594
Iteration [  371  ]
Obj. val : -5.945207869176086, Avg. Ret : -10.162235398147438
Iteration [  372  ]
Obj. val : -5.885303141625705, Avg. Ret : -9.785978943981222
Iteration [  373  ]
Obj. val : -5.985104586599337, Avg. Ret : -16.392393563165896
Iteration [  374  ]
Obj. val : -5.785813881463068, Avg. Ret : -9.919594294449741
Iteration [  375  ]
Obj. val : -5.860458041799297, Avg. Ret : -9.981143864310884
Iteration [  376  ]
Obj. val : -5.740627526851425, Avg. Ret : -16.507469725188763
Iteration [  377  ]
Obj. val : -5.8466108829258605, Avg. Ret : -9.927093409532894
Iteration [  378  ]
Obj. val : -5.774590812506672, Avg. Ret : -9.753708987077166
Iteration [  379  ]
Obj. val : -5.843023242950782, Avg. Ret : -16.407935181558795
Iteration [  380  ]
Obj. val : -5.546876946626019, Avg. Ret : -9.51630041607748
Iteration [  381  ]
Obj. val : -5.597449821966379, Avg. Ret : -10.155118471123686
Iteration [  382  ]
Obj. val : -5.751059167966419, Avg. Ret : -16.29359362519268
Iteration [  383  ]
Obj. val : -5.711585131735202, Avg. Ret : -9.84502581608579
Iteration [  384  ]
Obj. val : -5.545941564032543, Avg. Ret : -9.845265714744434
Iteration [  385  ]
Obj. val : -5.760332497278628, Avg. Ret : -16.018301120674177
Iteration [  386  ]
Obj. val : -5.665832152740809, Avg. Ret : -9.440412139446522
Iteration [  387  ]
Obj. val : -5.578778808185779, Avg. Ret : -9.928752226555412
Iteration [  388  ]
Obj. val : -5.677099655717235, Avg. Ret : -16.28565810101045
Iteration [  389  ]
Obj. val : -5.476465967376127, Avg. Ret : -10.059254031538511
Iteration [  390  ]
Obj. val : -5.742907514178451, Avg. Ret : -9.660444219564356
Iteration [  391  ]
Obj. val : -5.846016705345742, Avg. Ret : -16.096166488358136
Iteration [  392  ]
Obj. val : -5.579836048844857, Avg. Ret : -9.62104128478208
Iteration [  393  ]
Obj. val : -5.555749028412672, Avg. Ret : -9.588307069957514
Iteration [  394  ]
Obj. val : -5.51744509553533, Avg. Ret : -16.086319194473404
Iteration [  395  ]
Obj. val : -5.615145005133718, Avg. Ret : -9.560557089912368
Iteration [  396  ]
Obj. val : -5.597134311931084, Avg. Ret : -9.792728244149474
Iteration [  397  ]
Obj. val : -5.493077423898232, Avg. Ret : -16.076327176413546
Iteration [  398  ]
Obj. val : -5.527960066754232, Avg. Ret : -9.769932360608365
Iteration [  399  ]
Obj. val : -5.509489556175273, Avg. Ret : -9.410176317022708
checkpoint for objective values, iteration: 400. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_5.csv
checkpoint for avg return values, iteration: 400. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_5.csv
Iteration [  400  ]
Obj. val : -5.544884344356595, Avg. Ret : -15.952087618593248
Iteration [  401  ]
Obj. val : -5.36474327654422, Avg. Ret : -9.575561632629123
Iteration [  402  ]
Obj. val : -5.202161425023849, Avg. Ret : -9.53940707552041
Iteration [  403  ]
Obj. val : -5.356240202778526, Avg. Ret : -15.918701030893555
Iteration [  404  ]
Obj. val : -5.38097527838767, Avg. Ret : -9.597188190764468
Iteration [  405  ]
Obj. val : -5.200215989123469, Avg. Ret : -9.512332515897006
Iteration [  406  ]
Obj. val : -5.593432492256014, Avg. Ret : -15.732966349883702
Iteration [  407  ]
Obj. val : -5.361236316916839, Avg. Ret : -9.187654152058137
Iteration [  408  ]
Obj. val : -5.430388635103951, Avg. Ret : -9.698354828275617
Iteration [  409  ]
Obj. val : -5.50821179283954, Avg. Ret : -15.73707822496352
Iteration [  410  ]
Obj. val : -5.31180533901888, Avg. Ret : -8.982277366303084
Iteration [  411  ]
Obj. val : -5.520229838830511, Avg. Ret : -9.729174654691207
Iteration [  412  ]
Obj. val : -5.326695489505893, Avg. Ret : -15.91184365421675
Iteration [  413  ]
Obj. val : -5.208427428428797, Avg. Ret : -9.7806037303602
Iteration [  414  ]
Obj. val : -5.25108088740559, Avg. Ret : -8.879209907956042
Iteration [  415  ]
Obj. val : -5.311784453516213, Avg. Ret : -15.649333049115244
Iteration [  416  ]
Obj. val : -5.319166886375536, Avg. Ret : -9.686272577330158
Iteration [  417  ]
Obj. val : -5.164965326385576, Avg. Ret : -9.062086791890412
Iteration [  418  ]
Obj. val : -5.194759447400024, Avg. Ret : -15.553548732793494
Iteration [  419  ]
Obj. val : -5.3295869409059895, Avg. Ret : -9.332778894215732
Iteration [  420  ]
Obj. val : -5.104750118200774, Avg. Ret : -9.185717908886975
Iteration [  421  ]
Obj. val : -5.2557136267007145, Avg. Ret : -15.573241402158068
Iteration [  422  ]
Obj. val : -5.172860845636477, Avg. Ret : -9.759632937626696
Iteration [  423  ]
Obj. val : -5.37976946003327, Avg. Ret : -8.777359773483033
Iteration [  424  ]
Obj. val : -4.859880818118252, Avg. Ret : -15.59400004960994
Iteration [  425  ]
Obj. val : -5.239494657016686, Avg. Ret : -9.252947468738093
Iteration [  426  ]
Obj. val : -5.121106380039263, Avg. Ret : -9.154910714340737
Iteration [  427  ]
Obj. val : -5.027825992091809, Avg. Ret : -15.517637520519381
Iteration [  428  ]
Obj. val : -5.051616197763131, Avg. Ret : -9.78282657267654
Iteration [  429  ]
Obj. val : -5.153913210623459, Avg. Ret : -8.539133049534888
Iteration [  430  ]
Obj. val : -5.220220026524596, Avg. Ret : -15.483275545590045
Iteration [  431  ]
Obj. val : -5.333905161541503, Avg. Ret : -8.479871874508008
Iteration [  432  ]
Obj. val : -5.102218951772089, Avg. Ret : -9.507793085366881
Iteration [  433  ]
Obj. val : -4.982596141535642, Avg. Ret : -15.452857640497541
Iteration [  434  ]
Obj. val : -4.975586621947923, Avg. Ret : -8.822368810195025
Iteration [  435  ]
Obj. val : -4.956928914286718, Avg. Ret : -8.987681172678768
Iteration [  436  ]
Obj. val : -4.974740266753551, Avg. Ret : -15.242619336538615
Iteration [  437  ]
Obj. val : -5.03283932399231, Avg. Ret : -9.39508196580005
Iteration [  438  ]
Obj. val : -5.173438812033479, Avg. Ret : -8.451040514990806
Iteration [  439  ]
Obj. val : -5.021053726211294, Avg. Ret : -15.167606951070963
Iteration [  440  ]
Obj. val : -4.942752477064034, Avg. Ret : -9.351856739412858
Iteration [  441  ]
Obj. val : -5.095941612398506, Avg. Ret : -8.323481947385458
Iteration [  442  ]
Obj. val : -4.908645425559218, Avg. Ret : -15.206788721730064
Iteration [  443  ]
Obj. val : -5.01520651097417, Avg. Ret : -8.331396640182572
Iteration [  444  ]
Obj. val : -4.83557078532438, Avg. Ret : -9.406859705924001
Iteration [  445  ]
Obj. val : -4.86519547791781, Avg. Ret : -15.104031508068694
Iteration [  446  ]
Obj. val : -5.073186500824176, Avg. Ret : -9.090726044644988
Iteration [  447  ]
Obj. val : -4.780649128036498, Avg. Ret : -8.265564746663086
Iteration [  448  ]
Obj. val : -4.88527499619999, Avg. Ret : -14.934417313329984
Iteration [  449  ]
Obj. val : -4.869506215859401, Avg. Ret : -8.733106930700684
Iteration [  450  ]
Obj. val : -4.917371448273085, Avg. Ret : -8.537517397667903
Iteration [  451  ]
Obj. val : -4.73221084994299, Avg. Ret : -15.090854117457852
Iteration [  452  ]
Obj. val : -4.826566717095402, Avg. Ret : -8.684992624700703
Iteration [  453  ]
Obj. val : -4.773967769969917, Avg. Ret : -8.674084304430679
Iteration [  454  ]
Obj. val : -5.001962805159015, Avg. Ret : -14.818994978408696
Iteration [  455  ]
Obj. val : -4.835991500684019, Avg. Ret : -8.246190076443893
Iteration [  456  ]
Obj. val : -4.877847342685564, Avg. Ret : -9.059545617628078
Iteration [  457  ]
Obj. val : -4.731672246789124, Avg. Ret : -14.843410237014083
Iteration [  458  ]
Obj. val : -4.75473224646206, Avg. Ret : -8.128535602695777
Iteration [  459  ]
Obj. val : -4.892078485055775, Avg. Ret : -9.06176314348142
Iteration [  460  ]
Obj. val : -4.745735691257086, Avg. Ret : -14.75322986230446
Iteration [  461  ]
Obj. val : -4.69617146196511, Avg. Ret : -8.443681102750391
Iteration [  462  ]
Obj. val : -4.628463061438252, Avg. Ret : -8.490700119335367
Iteration [  463  ]
Obj. val : -4.763343109752424, Avg. Ret : -14.703860481257143
Iteration [  464  ]
Obj. val : -4.714917256287072, Avg. Ret : -8.729039067627037
Iteration [  465  ]
Obj. val : -4.65837413286912, Avg. Ret : -8.273667485792025
Iteration [  466  ]
Obj. val : -4.798368289606647, Avg. Ret : -14.581772081100754
Iteration [  467  ]
Obj. val : -4.77876274996027, Avg. Ret : -8.51327464308914
Iteration [  468  ]
Obj. val : -4.698976143181316, Avg. Ret : -8.46286689570449
Iteration [  469  ]
Obj. val : -4.45273246687385, Avg. Ret : -14.534238488190356
Iteration [  470  ]
Obj. val : -4.567395511812069, Avg. Ret : -8.685745200391727
Iteration [  471  ]
Obj. val : -4.382177923541083, Avg. Ret : -8.096530337673412
Iteration [  472  ]
Obj. val : -4.591786365239978, Avg. Ret : -14.543045418149767
Iteration [  473  ]
Obj. val : -4.646736730100079, Avg. Ret : -8.569490045808168
Iteration [  474  ]
Obj. val : -4.569660194170938, Avg. Ret : -8.061503940434909
Iteration [  475  ]
Obj. val : -4.561325835762915, Avg. Ret : -14.206191550938263
Iteration [  476  ]
Obj. val : -4.591540213896472, Avg. Ret : -8.078329251423252
Iteration [  477  ]
Obj. val : -4.493010540779822, Avg. Ret : -8.700272529380124
Iteration [  478  ]
Obj. val : -4.558046460884045, Avg. Ret : -14.38861227313986
Iteration [  479  ]
Obj. val : -4.618627820677738, Avg. Ret : -8.594564122263199
Iteration [  480  ]
Obj. val : -4.389455569263316, Avg. Ret : -7.881875926238129
Iteration [  481  ]
Obj. val : -4.641507108852416, Avg. Ret : -14.40395595243328
Iteration [  482  ]
Obj. val : -4.6620279771637, Avg. Ret : -7.944368855238126
Iteration [  483  ]
Obj. val : -4.4594708311711075, Avg. Ret : -8.499702515277669
Iteration [  484  ]
Obj. val : -4.576045771031188, Avg. Ret : -14.099085029602442
Iteration [  485  ]
Obj. val : -4.192211482456493, Avg. Ret : -7.862274672219571
Iteration [  486  ]
Obj. val : -4.593732659398893, Avg. Ret : -8.443986976647302
Iteration [  487  ]
Obj. val : -4.5942789656278356, Avg. Ret : -14.215778326270593
Iteration [  488  ]
Obj. val : -4.489823199785229, Avg. Ret : -7.9872291991674365
Iteration [  489  ]
Obj. val : -4.705608503608681, Avg. Ret : -8.066414095617386
Iteration [  490  ]
Obj. val : -4.480693425217791, Avg. Ret : -14.136034072985636
Iteration [  491  ]
Obj. val : -4.507506082972672, Avg. Ret : -8.48441188507315
Iteration [  492  ]
Obj. val : -4.562678291849306, Avg. Ret : -7.806331971893599
Iteration [  493  ]
Obj. val : -4.377866928591137, Avg. Ret : -14.130648146465374
Iteration [  494  ]
Obj. val : -4.405976315135832, Avg. Ret : -8.141589555364549
Iteration [  495  ]
Obj. val : -4.536084434730757, Avg. Ret : -7.816485594054513
Iteration [  496  ]
Obj. val : -4.479586415945727, Avg. Ret : -14.14424070727722
Iteration [  497  ]
Obj. val : -4.312381686595147, Avg. Ret : -7.712884994608864
Iteration [  498  ]
Obj. val : -4.507715103898879, Avg. Ret : -8.353525049209805
Iteration [  499  ]
Obj. val : -4.392036053954925, Avg. Ret : -14.14951170917815
checkpoint for objective values, iteration: 500. Saved at  ./tests/mountaincar/alpha_0_1/ evar_obj_5.csv
checkpoint for objective values, iteration: 500. Saved at  ./tests/mountaincar/alpha_0_1/ evar_ret_5.csv
